In [1]:
import logging
import numpy as np
import pandas as pd
root = logging.getLogger()
root.addHandler(logging.StreamHandler())
%matplotlib inline
In [2]:
# download from Google Drive: https://drive.google.com/open?id=0B9cazFzBtPuCSFp3YWE1V2JGdnc
from iSDM.species import IUCNSpecies
fish = IUCNSpecies(name_species='All')
fish.load_shapefile('../data/fish/FW_FISH.shp') # warning, 2GB of data will be loaded, may take a while!!
In [3]:
fish.get_data().columns
Out[3]:
How many unique binomials are there?
In [4]:
fish_data = fish.get_data()
fish_data['binomial'].unique().size
Out[4]:
Get their names in an array:
In [5]:
unique_binomials = fish_data['binomial'].unique()
unique_binomials
Out[5]:
In [6]:
fish_data.head(10) # peek at the first 10 records
Out[6]:
Sort them by the "shape_area" column to get the smallest and biggest areas.
In [7]:
fish_data.sort_values(by='shape_area', inplace=True)
Peek at the first 5 records (the smallest areas):
In [8]:
fish_data.head(5)
Out[8]:
The last 5 records (biggest area)
In [9]:
fish_data.tail(5)
Out[9]:
Decision: "We will include all species except those that are completely extinct. For the (possibly) extant species, we will include their entire range (including polygons from which they are currently extinct) in order to cover their full potential distribution."
From IUCN, these are the codes for presence: 1 = Extant, 2 = Probably Extant, 3 = Possibly Extant, 4 = Possibly Extinct, 5 = Extinct, 6 = Presence Uncertain.
Are there species for which the presence category isn't any of the above? (The "~" is negation, so the expression below selects all fish data for which the "presence" column is NOT in [1, 2, 3, 4, 5, 6].)
In [10]:
fish_data[~fish_data.presence.isin([1,2,3,4,5,6])]
Out[10]:
Apparently there are 28 records for which the "presence" is set to 0 in some regions. Their binomials are:
In [11]:
fish_data[~fish_data.presence.isin([1,2,3,4,5,6])]['binomial']
Out[11]:
Actually that's 26 unique species, since "Acipenser fulvescens" has 3 separate records (polygons).
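We can double-check by counting unique binomials instead of raw records:
fish_data[~fish_data.presence.isin([1,2,3,4,5,6])]['binomial'].unique().size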
"For the (possibly) extant species, we will include their entire range (including polygons from which they are currently extinct)"
As an example, here is a species with both extant and extinct areas
In [12]:
fish_data[fish_data.binomial=='Acantharchus pomotis']
Out[12]:
There are plenty of columns; let's select just 'binomial', 'presence', 'geometry', and 'shape_area' for a clearer overview.
In [13]:
fish_data[fish_data.binomial=='Acantharchus pomotis'][['binomial','presence', 'geometry','shape_area']]
Out[13]:
As agreed, we want to keep the first polygon (presence==5, i.e., extinct) because there are other regions (the next two records) where the species is not extinct. There is a function that does this filtering in a simple way.
In [14]:
fish.drop_extinct_species()
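For reference, a minimal pandas sketch of what this filtering amounts to, assuming presence == 5 marks an extinct polygon (the actual drop_extinct_species implementation may differ):
# Keep every species with at least one non-extinct polygon,
# and keep all polygons (extinct ones included) of those species.
extant_binomials = fish_data[fish_data.presence != 5]['binomial'].unique()
non_extinct = fish_data[fish_data.binomial.isin(extant_binomials)]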
In [15]:
fish.save_data("../data/fish/selection/non_extinct.pkl", method="pickle")
In [16]:
non_extinct_fish = fish.get_data()
In [17]:
total_records = 0
# download the file "merged.msg" from here: (My Google Drive)
# https://drive.google.com/open?id=0B9cazFzBtPuCTHcyTmVXV0pNT0k
# and place it in the subfolder "selection".
# The "merged.msg" file contains the dataframes for all individual species.
for df in pd.read_msgpack("../data/fish/selection/merged.msg", iterator=True):
    total_records += df.shape[0]
In [18]:
total_records
Out[18]:
In [19]:
important_columns = ['species', 'dateidentified','basisofrecord', 'verbatimlocality', 'day', 'month', 'year' ]
result_no_lat_long = pd.DataFrame(columns=important_columns)
for df in pd.read_msgpack("../data/fish/selection/merged.msg", iterator=True):
    if "decimallatitude" not in df.columns.tolist() or "decimallongitude" not in df.columns.tolist():
        common_columns = list(set(important_columns).intersection(set(df.columns.tolist())))
        result_no_lat_long = result_no_lat_long.append(df[common_columns], ignore_index=True)
In [20]:
result_no_lat_long['species'].unique().size
Out[20]:
In [21]:
(result_no_lat_long.shape[0]/total_records) * 100 # not that bad, only about 0.2%
Out[21]:
In [22]:
result_no_lat_long[['species', 'verbatimlocality']][result_no_lat_long.verbatimlocality.notnull()]
Out[22]:
How many records have a verbatim locality?
In [23]:
result_no_lat_long[['species', 'verbatimlocality']][result_no_lat_long.verbatimlocality.notnull()].shape[0]
Out[23]:
In [24]:
grouped_no_lat_lon = pd.DataFrame()
grouped_no_lat_lon['count'] = result_no_lat_long.groupby(['species', 'basisofrecord']).apply(lambda x: x['basisofrecord'].count())
grouped_no_lat_lon.head(30)
Out[24]:
In [25]:
grouped_no_lat_lon[grouped_no_lat_lon['count']>50]
Out[25]:
According to http://gbif.github.io/gbif-api/apidocs/org/gbif/api/vocabulary/BasisOfRecord.html these are different from "real" human observations. But I'm not sure what PRESERVED_SPECIMEN means, exactly.
In [26]:
result_no_lat_long_years = result_no_lat_long[['species','year']][result_no_lat_long.year > 1960].groupby('species')['year'].apply(lambda x:x.tolist())
pd.DataFrame(result_no_lat_long_years).head(30)
Out[26]:
In [27]:
pd.DataFrame(result_no_lat_long_years).shape[0]
Out[27]:
228 unique species with records after 1960, but no useful locality info about them anyway. I think all records without lat/lon will need to be discarded, for the 600 species.
Further selection criteria...
In [28]:
import pandas as pd
important_columns1 = ['species', 'dateidentified', 'eventdate', 'basisofrecord', 'decimallatitude','decimallongitude', 'day', 'month', 'year' ]
result_with_lat_long = pd.DataFrame(columns=important_columns1)
counter = 0
for df in pd.read_msgpack("../data/fish/selection/merged.msg", iterator=True):
    counter += 1
    if (counter%100==0):
        print("Processing.. ", counter)
    if "decimallatitude" in df.columns.tolist() and "decimallongitude" in df.columns.tolist():
        common_columns = list(set(important_columns1).intersection(set(df.columns.tolist())))
        result_with_lat_long = result_with_lat_long.append(df[common_columns], ignore_index=True)
In [29]:
result_with_lat_long = result_with_lat_long[result_with_lat_long.decimallatitude.notnull() & result_with_lat_long.decimallongitude.notnull()]
In [30]:
result_with_lat_long.shape[0] # this-many occurrence records
Out[30]:
In [31]:
result_with_lat_long.shape[0]/ total_records * 100 # percentage of records out of *ALL* species records
Out[31]:
In [32]:
result_with_lat_long['species'].unique().size
Out[32]:
In [33]:
result_with_lat_long_no_date = result_with_lat_long[(result_with_lat_long.eventdate.isnull()) & (result_with_lat_long.year.isnull())]
In [34]:
result_with_lat_long_no_date.shape[0]/result_with_lat_long.shape[0] * 100 # 12%
Out[34]:
Best to take into account all observations that have either "year" or "eventdate" present (or both). Let's group them by species name and count the number of observation records.
In [35]:
grouped_lat_long_year_or_eventdate = pd.DataFrame()
grouped_lat_long_year_or_eventdate['count'] = result_with_lat_long[result_with_lat_long.eventdate.notnull() | result_with_lat_long.year.notnull()].groupby(['species']).apply(lambda x: x['species'].count())
grouped_lat_long_year_or_eventdate.head(10) # peek at the top 10 only
Out[35]:
In [36]:
grouped_lat_long_year_or_eventdate.shape[0]
Out[36]:
In [37]:
100 * result_with_lat_long[result_with_lat_long.eventdate.notnull() | result_with_lat_long.year.notnull()].shape[0] / result_with_lat_long.shape[0]
Out[37]:
In [38]:
year_or_eventdate_1960 = result_with_lat_long[['species', 'year', 'eventdate']][(result_with_lat_long.year>1960) | (result_with_lat_long.eventdate>"1960")] # eventdate is an ISO-format string here, so comparing with "1960" is lexicographic
grouped_year_or_eventdate_1960 = pd.DataFrame()
grouped_year_or_eventdate_1960['numobservations'] = year_or_eventdate_1960.groupby(['species']).apply(lambda x: x['species'].count())
grouped_year_or_eventdate_1960.shape[0]
Out[38]:
In [39]:
year_or_eventdate_1960.shape[0]/result_with_lat_long.shape[0] * 100
Out[39]:
In [40]:
grouped_year_or_eventdate_1960[grouped_year_or_eventdate_1960.numobservations>=50]
Out[40]:
In [41]:
(grouped_year_or_eventdate_1960[grouped_year_or_eventdate_1960.numobservations>50].numobservations.sum() / result_with_lat_long.shape[0]) * 100
Out[41]:
So 80% of all records with latitude and longitude are from after 1960 and belong to species with more than 50 occurrences. But note that this still covers only 1281 unique species (out of the 6280 we started with).
In [42]:
100 * grouped_year_or_eventdate_1960[grouped_year_or_eventdate_1960.numobservations>50].numobservations.sum() / grouped_year_or_eventdate_1960.numobservations.sum()
Out[42]:
OK, that means most (98%) of the post-1960 records with latitude/longitude belong to species with more than 50 records.
In [43]:
year_or_eventdate_1990 = result_with_lat_long[['species', 'year', 'eventdate', 'basisofrecord']][(result_with_lat_long.year>=1990) | (result_with_lat_long.eventdate>="1990")]
grouped_year_or_eventdate_1990 = pd.DataFrame()
grouped_year_or_eventdate_1990['numobservations'] = year_or_eventdate_1990.groupby(['species']).apply(lambda x: x['species'].count())
grouped_year_or_eventdate_1990.shape[0] # number of unique species
Out[43]:
In [44]:
year_or_eventdate_1990.shape[0]/result_with_lat_long.shape[0] * 100
Out[44]:
In [45]:
grouped_year_or_eventdate_1990[grouped_year_or_eventdate_1990.numobservations>=50]
Out[45]:
From the meeting: the test set should include at least (1) the species for which lab test data on thermal tolerance are available, and (2) species with very small and very large ranges, in order to find out whether the point sampling and modelling also work for these extremes.
In [46]:
non_extinct_fish.tail(1).binomial
Out[46]:
See all the records (areas) for this binomial:
In [47]:
non_extinct_fish[non_extinct_fish.binomial=="Esox lucius"]
Out[47]:
In [48]:
esox_lucius = IUCNSpecies(name_species="Esox lucius")
In [49]:
esox_lucius.set_data(non_extinct_fish[non_extinct_fish.binomial=="Esox lucius"])
In [50]:
esox_lucius.save_shapefile("../data/fish/selection/esox_lucius")
In [51]:
esox_lucius.plot_species_occurrence()
In [52]:
non_extinct_fish.head(1).binomial
Out[52]:
See all the records (areas) for this binomial:
In [53]:
non_extinct_fish[non_extinct_fish.binomial=="Astatotilapia burtoni"]
Out[53]:
In [54]:
astatotilapia_burtoni = IUCNSpecies(name_species="Astatotilapia burtoni")
In [55]:
astatotilapia_burtoni.set_data(non_extinct_fish[non_extinct_fish.binomial=="Astatotilapia burtoni"])
In [56]:
astatotilapia_burtoni.save_shapefile("../data/fish/selection/astatotilapia_burtoni")
In [57]:
astatotilapia_burtoni.plot_species_occurrence()
Below is just another way of saving the data: not as a shapefile (which produces multiple files in a separate folder), but as pickled data in a single, compressed file. This is usually a lot faster than saving a shapefile when there are large amounts of data.
In [58]:
astatotilapia_burtoni.save_data(dir_name="../data/fish/selection/", method="pickle")
In [59]:
esox_lucius.save_data(dir_name="../data/fish/selection/", method="pickle")
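Reading such a pickle back later should be symmetric via load_data (used further below for the GBIF data); note that the exact file name save_data writes under dir_name is an assumption here:
esox_lucius_reloaded = IUCNSpecies(name_species="Esox lucius")
esox_lucius_reloaded.load_data("../data/fish/selection/Esox lucius.pkl") # hypothetical file name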
Since the records are individual shapes, and there can be multiple per species (binomial), let's group them by species name and sum the shape_area column. This gives the total area (sum of all polygons) per species. We want this in order to decide what our "average" species will be, for testing the workflow.
In [60]:
species_area_sum = non_extinct_fish.groupby('binomial')['shape_area'].apply(np.sum)
In [61]:
species_area_sum.sort_values(inplace=True)
In [62]:
species_area_sum.head(10)
Out[62]:
In [63]:
species_area_sum.tail(10)
Out[63]:
In [64]:
species_area_sum.hist(bins=100)
Out[64]:
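The heavy tail is easier to see with a logarithmic count axis; hist passes log=True through to matplotlib:
species_area_sum.hist(bins=100, log=True)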
The distribution of areas (in km^2?) is exponential. The median value is rather low:
In [65]:
species_area_sum.median()
Out[65]:
In [66]:
np.average(species_area_sum)
Out[66]:
In [67]:
species_area_sum[(species_area_sum>45) & (species_area_sum<46)]
Out[67]:
In [68]:
non_extinct_fish[non_extinct_fish.binomial=="Acrocheilus alutaceus"]
Out[68]:
In [69]:
acrocheilus_alutaceus = IUCNSpecies(name_species="Acrocheilus alutaceus")
In [70]:
acrocheilus_alutaceus.set_data(non_extinct_fish[non_extinct_fish.binomial=="Acrocheilus alutaceus"])
In [71]:
acrocheilus_alutaceus.plot_species_occurrence()
In [72]:
acrocheilus_alutaceus.save_data(dir_name="../data/fish/selection/", method="pickle")
In [73]:
acrocheilus_alutaceus.save_shapefile("../data/fish/selection/acrocheilus_alutaceus")
The individual polygons are shown below. They are also "not valid" geometries, which makes them an interesting case study.
In [74]:
non_extinct_fish.loc[10322].geometry
Out[74]:
In [75]:
non_extinct_fish.loc[10320].geometry
Out[75]:
In [76]:
non_extinct_fish.loc[10321].geometry
Out[76]:
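A quick way to see why such a geometry is flagged as invalid is shapely's validity API (the geometries here are shapely objects):
from shapely.validation import explain_validity
geom = non_extinct_fish.loc[10322].geometry
geom.is_valid # False for an invalid polygon
print(explain_validity(geom)) # e.g. a self-intersection message with coordinates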
In [77]:
non_extinct_binomials = non_extinct_fish.binomial.unique().tolist()
Persist the list of non-extinct binomials we got from IUCN, so we don't have to filter again.
In [78]:
import pickle
pickle.dump(non_extinct_binomials, open("../data/fish/selection/non_extinct_binomials.pkl","wb"))
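Loading it back later is symmetric:
with open("../data/fish/selection/non_extinct_binomials.pkl", "rb") as f:
    non_extinct_binomials = pickle.load(f)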
In [79]:
non_extinct_binomials.index("Perca fluviatilis")
Out[79]:
Let's read Aafke's Excel file with lab test data on thermal tolerance per species:
In [80]:
thermal_tolerance_df = pd.read_excel("../data/fish/selection/Lethal_temperature_freshwater_fish_July2016.xlsx")
thermal_tolerance_df.head(10)
Out[80]:
In [81]:
thermal_tolerance_df.columns
Out[81]:
In [82]:
lab_data_list = thermal_tolerance_df['Species '].tolist() # note the trailing space in the column name
In [83]:
species_with_lat_lon_after_1960 = year_or_eventdate_1960['species'].unique().tolist()
For every species in the lab data list, select it if it is also in the IUCN list of non-extinct binomials AND in the filtered GBIF list of species with latitude/longitude information and event year > 1960:
In [84]:
filtered_list = []
for species_name in lab_data_list:
    if species_name.strip() in non_extinct_binomials and species_name.strip() in species_with_lat_lon_after_1960:
        filtered_list.append(species_name.strip()) # strip() just removes stray spaces in the names
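Equivalently, as a set intersection (same logic, more compact, though a set loses the original ordering):
filtered_set = ({s.strip() for s in lab_data_list}
                & set(non_extinct_binomials)
                & set(species_with_lat_lon_after_1960))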
Now get the number of point records for this list of lab species (cross-checked with filtered GBIF records)
In [85]:
year_or_eventdate_1960[year_or_eventdate_1960.species.isin(filtered_list)].groupby('species')['species'].apply(lambda x: x.count())
Out[85]:
In [86]:
tmp_series = year_or_eventdate_1960[year_or_eventdate_1960.species.isin(filtered_list)].groupby('species')['species'].apply(lambda x: x.count())
In [87]:
tmp_series[tmp_series>100] # species with more than 100 records
Out[87]:
So this is our potential list to choose a representative example from
In [88]:
tmp_series[tmp_series>100].keys()
Out[88]:
In [89]:
len(tmp_series[tmp_series>100].keys())
Out[89]:
In [90]:
len(filtered_list) # so 20 species from this list fall out for not having enough point records
Out[90]:
In [91]:
tmp_series[tmp_series>100].sort_values()
Out[91]:
Get the GBIF/IUCN data on the first and the last species in the sorted list. That will be our representative choice for testing the workflow.
In [93]:
lepidomeda_mollispinis = IUCNSpecies(name_species="Lepidomeda mollispinis")
lepidomeda_mollispinis.set_data(non_extinct_fish[non_extinct_fish.binomial=="Lepidomeda mollispinis"])
lepidomeda_mollispinis.save_shapefile("../data/fish/selection/lepidomeda_mollispinis")
lepidomeda_mollispinis.plot_species_occurrence()
from iSDM.species import GBIFSpecies
my_species = GBIFSpecies(name_species="Lepidomeda mollispinis")
# download point-records on these species from: https://drive.google.com/open?id=0B9cazFzBtPuCMGlLMnQzb3hsQm8
data = my_species.load_data("../data/fish/selection/Lepidomeda mollispinis2361895.pkl")
my_species.plot_species_occurrence()
In [94]:
salmo_trutta = IUCNSpecies(name_species="Salmo trutta")
salmo_trutta.set_data(non_extinct_fish[non_extinct_fish.binomial=="Salmo trutta"])
salmo_trutta.save_shapefile("../data/fish/selection/salmo_trutta")
salmo_trutta.plot_species_occurrence()
my_species = GBIFSpecies(name_species="Salmo trutta")
# download point-records on these species from: https://drive.google.com/open?id=0B9cazFzBtPuCWEIySU5oU2ZfT2M
data = my_species.load_data("../data/fish/selection/Salmo trutta8215487.pkl")
my_species.plot_species_occurrence() # warning: a lot of point-records, may take a while!!
Interesting: lots of point records fall outside the expert range, in particular in the US.
In [95]:
my_species.overlay(salmo_trutta)
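For reference, a rough geopandas sketch of what this overlay presumably does, keeping only the point records that fall within the expert-range polygons (the actual iSDM implementation may differ):
import geopandas as gpd
from shapely.geometry import Point

points = my_species.get_data()
point_geoms = [Point(xy) for xy in zip(points.decimallongitude, points.decimallatitude)]
points_gdf = gpd.GeoDataFrame(points, geometry=point_geoms)
range_union = salmo_trutta.get_data().geometry.unary_union # merge all range polygons
points_within = points_gdf[points_gdf.geometry.within(range_union)]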
In [ ]:
my_species.get_data()
In [96]:
my_species.plot_species_occurrence()
In [110]:
result_with_lat_long[(result_with_lat_long.species=='Esox lucius') & (result_with_lat_long.year>1960)]
Out[110]:
In [114]:
result_with_lat_long[(result_with_lat_long.species=='Astatotilapia burtoni') & (result_with_lat_long.year>1960)]
Out[114]:
In [115]:
result_with_lat_long[(result_with_lat_long.species=='Astatotilapia burtoni') & (result_with_lat_long.year>1960)].shape
Out[115]:
In [116]:
result_with_lat_long[(result_with_lat_long.species=='Acrocheilus alutaceus') & (result_with_lat_long.year>1960)].shape
Out[116]:
In [ ]: