jupyter.idigbio.org Pyspark3


In [15]:
sqlContext


Out[15]:
<pyspark.sql.context.SQLContext at 0x7f52695fa240>

In [16]:
index = "idigbio"
nodes = "c18node14.acis.ufl.edu,c18node2.acis.ufl.edu,c18node6.acis.ufl.edu,c18node10.acis.ufl.edu,c18node12.acis.ufl.edu"
query = '{"query": {"bool": {"must": [{"term":{"genus":"acer"}}, {"term":{"stateprovince":"vermont"}}]}}}'
fields = ("uuid,kingdom,phylum,order,class,family,genus,group,specificepithet,infraspecificepithet,scientificname,commonname,canonicalname,highertaxon,"
          "datecollected,continent,country,countrycode,stateprovince,municipality,waterbody,"
          "occurenceid,catalognumber,fieldnumber,collectioncode,collectionid,collector,barcodevalue,basisofrecord,individualcount"
)

fields = "uuid,data.dwc:eventDate"

In [17]:
# Let's try using the API to get a list of column names

import requests

meta_fields_records = (requests
                       .get("http://search.idigbio.org/v2/meta/fields/records")
                       .json()
                       )

field_set = set()
for k,v in meta_fields_records.items():
    if v.get("fieldName", False):
        field_set.add(k)
        
    if k == "data":
        for kd,vd in v.items():
            if vd.get("fieldName", False):
                field_set.add("data.{0}".format(kd))
                pass
        
#print(sorted(fields))
#field_set.remove("geopoint")
#field_set.remove("flags")

#field_list = sorted(field_set)[0:round(len(field_set)/2)]
#field_list = sorted(field_set)[round(len(field_set)/2):]

#field_list = field_list[0:round(len(field_list)/2)]
#field_list = field_list[round(len(field_list)/2):]
# fails too

#field_list = field_list[0:round(len(field_list)/2)]
#field_list = field_list[round(len(field_list)/2):]

#field_list = field_list[0:round(len(field_list)/2)]

fields = ",".join(field_set)

print(fields)


data.dcterms:source,etag,member,institutionid,data.dcterms:license,data.dwc:identificationReferences,data.dwc:highestBiostratigraphicZone,continent,data.dwc:scientificName,data.dwc:higherClassification,data.dwc:waterBody,data.dwc:datasetName,data.dwc:eventID,data.dwc:identifiedBy,data.dwc:maximumElevationInMeters,order,canonicalname,data.fcc:datePicked,version,institutionname,data.dwc:latestEraOrHighestErathem,maxelevation,verbatimeventdate,data.dwc:group,data.dwc:startDayOfYear,data.dwc:dataGeneralizations,data.dwc:acceptedNameUsage,flags,data.dcterms:references,latesteraorhighesterathem,family,scientificname,data.dwc:habitat,data.dwc:rightsHolder,data.dcterms:bibliographicCitation,data.dwc:dynamicProperties,data.dwc:specificEpithet,data.fcc:pickedBy,data.dwc:nameAccordingToID,class,data.dwc:taxonRemarks,data.dwc:maximumDepthInMeters,municipality,data.dwc:earliestAgeOrLowestStage,highertaxon,datemodified,country,data.dwc:collectionID,data.dwc:coordinateUncertaintyInMeters,infraspecificepithet,data.dwc:endDayOfYear,data.dwc:namePublishedIn,earliestperiodorlowestsystem,hasMedia,data.dwc:latestPeriodOrHighestSystem,collectioncode,data.dwc:recordedBy,dqs,catalognumber,hasImage,data.dwc:identificationRemarks,data.dwc:county,data.dwc:otherCatalogNumbers,highestbiostratigraphiczone,data.dwc:eventRemarks,data.dwc:previousIdentifications,fieldnumber,institutioncode,data.dwc:bed,data.dwc:identificationQualifier,data.dwc:nameAccordingTo,data.dwc:originalNameUsage,data.dwc:institutionCode,data.dwc:preparations,collectionid,data.dc:rights,data.dwc:lowestBiostratigraphicZone,data.dwc:phylum,data.dwc:recordNumber,occurrenceid,data.dwc:georeferencedDate,data.dwc:day,data.dwc:latestAgeOrHighestStage,data.dwc:verbatimEventDate,commonname,latestepochorhighestseries,data.dwc:infraspecificEpithet,data.dwc:genus,verbatimlocality,countrycode,data.dwc:individualID,data.dwc:nomenclaturalCode,waterbody,data.dwc:identificationVerificationStatus,data.dwc:occurrenceRemarks,data.dwc:taxonRank,data.idigbio:preservative,locality,data.dwc:verbatimElevation,data.idigbio:superfamily,genus,data.dwc:minimumDepthInMeters,data.dwc:municipality,recordset,data.dwc:verbatimCoordinateSystem,uuid,data.dwc:taxonomicStatus,data.dwc:subgenus,data.dwc:namePublishedInID,data.dcterms:language,data.dwc:samplingEffort,data.dwc:georeferenceSources,data.dwc:georeferenceProtocol,kingdom,data.dwc:coordinatePrecision,data.dwc:associatedMedia,data.dwc:ownerInstitutionCode,data.dcterms:modified,data.dwc:individualCount,data.dwc:associatedTaxa,coordinateuncertainty,geologicalcontextid,data.dwc:georeferencedBy,barcodevalue,data.dwc:stateProvince,data.dwc:dateIdentified,data.dwc:establishmentMeans,taxonomicstatus,data.dwc:parentNameUsage,data.dwc:basisOfRecord,data.dwc:year,data.dwc:georeferenceVerificationStatus,data.dwc:locationID,data.dwc:higherGeography,data.dwc:islandGroup,data.dwc:samplingProtocol,specificepithet,taxonrank,data.dwc:institutionID,geopoint,minelevation,earliesteonorlowesteonothem,data.dwc:accessRights,data.dwc:vernacularName,data.dcterms:rightsHolder,data.dwc:country,stateprovince,earliestageorloweststage,data.dwc:datasetID,datecollected,data.dwc:latestEonOrHighestEonothem,data.dwc:verbatimSRS,typestatus,data.dwc:latestEpochOrHighestSeries,collectionname,data.dwc:decimalLatitude,data.dwc:disposition,data.dwc:footprintWKT,data.dwc:formation,data.dwc:associatedSequences,data.dwc:verbatimLongitude,data.dwc:associatedOccurrences,data.idigbio:recordId,lithostratigraphicterms,data.dwc:countryCode,formation,data.dwc:taxonID,data.dwc:namePublishedInYear,individualcount,mindepth,data.dwc:decimalLongitude,data.dwc:typeStatus,data.dwc:georeferenceRemarks,data.dwc:month,data.dwc:locationAccordingTo,commonnames,latesteonorhighesteonothem,data.dwc:occurrenceStatus,data.dwc:informationWithheld,data.dwc:locality,eventdate,earliesteraorlowesterathem,data.symbiota:verbatimScientificName,data.dcterms:rights,data.dwc:VerbatimEventDate,data.coreid,data.dwc:continent,data.dwc:catalogNumber,bed,data.idigbio:subfamily,data.dwc:earliestEonOrLowestEonothem,data.dwc:lifeStage,startdayofyear,data.dwc:eventTime,data.dwc:sex,data.dwc:order,data.dwc:island,group,data.dwc:kingdom,collector,mediarecords,recordids,data.dwc:lithostratigraphicTerms,data.dwc:scientificNameID,earliestepochorlowestseries,data.dwc:verbatimCoordinates,phylum,latestageorhigheststage,data.dwc:geologicalContextID,data.dcterms:type,data.dwc:eventDate,data.dwc:geodeticDatum,data.dwc:identificationID,data.dwc:earliestEpochOrLowestSeries,data.dwc:reproductiveCondition,data.dwc:minimumElevationInMeters,basisofrecord,data.id,data.dwc:class,data.dwc:nomenclaturalStatus,data.dwc:verbatimDepth,data.idigbio:substrate,data.dwc:verbatimLocality,data.symbiota:recordEnteredBy,data.dwc:earliestPeriodOrLowestSystem,data.dcterms:accessRights,recordnumber,data.dwc:higherGeographyID,data.dwc:locationRemarks,data.dwc:fieldNotes,data.dwc:collectionCode,lowestbiostratigraphiczone,data.dwc:scientificNameAuthorship,data.dwc:verbatimTaxonRank,taxonid,data.dwc:behavior,data.dwc:family,data.dwc:member,data.dwc:occurrenceID,data.dwc:verbatimLatitude,data.dwc:occurrenceDetails,county,maxdepth,data.dwc:organismID,data.dwc:fieldNumber,latestperiodorhighestsystem,data.dwc:rights,data.dwc:earliestEraOrLowestErathem,data.dwc:associatedReferences

In [19]:
bad_field_set = set()
for field in sorted(field_set):
        try:
            df = (sqlContext.read.format("org.elasticsearch.spark.sql")
                .option("es.query", query)
                .option("es.read.field.include", field)
                .option("es.read.as.array.include", "commonnames")
                .option("es.nodes", nodes)
                .load("{0}/records".format(index))
                .write
                .mode("overwrite")
                .parquet("/outputs/scrap")
            )
            print("works: {0}".format(field))
        except:
            print("does not work: {0}".format(field))
            bad_field_set.add(field)


works: barcodevalue
works: basisofrecord
works: bed
works: canonicalname
works: catalognumber
works: class
works: collectioncode
works: collectionid
works: collectionname
works: collector
works: commonname
does not work: commonnames
works: continent
works: coordinateuncertainty
works: country
works: countrycode
works: county
works: data.coreid
works: data.dc:rights
works: data.dcterms:accessRights
works: data.dcterms:bibliographicCitation
works: data.dcterms:language
works: data.dcterms:license
works: data.dcterms:modified
works: data.dcterms:references
works: data.dcterms:rights
works: data.dcterms:rightsHolder
works: data.dcterms:source
works: data.dcterms:type
works: data.dwc:VerbatimEventDate
works: data.dwc:acceptedNameUsage
works: data.dwc:accessRights
works: data.dwc:associatedMedia
works: data.dwc:associatedOccurrences
works: data.dwc:associatedReferences
works: data.dwc:associatedSequences
works: data.dwc:associatedTaxa
works: data.dwc:basisOfRecord
works: data.dwc:bed
works: data.dwc:behavior
works: data.dwc:catalogNumber
works: data.dwc:class
works: data.dwc:collectionCode
works: data.dwc:collectionID
works: data.dwc:continent
works: data.dwc:coordinatePrecision
works: data.dwc:coordinateUncertaintyInMeters
works: data.dwc:country
works: data.dwc:countryCode
works: data.dwc:county
works: data.dwc:dataGeneralizations
works: data.dwc:datasetID
works: data.dwc:datasetName
works: data.dwc:dateIdentified
works: data.dwc:day
works: data.dwc:decimalLatitude
works: data.dwc:decimalLongitude
works: data.dwc:disposition
works: data.dwc:dynamicProperties
works: data.dwc:earliestAgeOrLowestStage
works: data.dwc:earliestEonOrLowestEonothem
works: data.dwc:earliestEpochOrLowestSeries
works: data.dwc:earliestEraOrLowestErathem
works: data.dwc:earliestPeriodOrLowestSystem
works: data.dwc:endDayOfYear
works: data.dwc:establishmentMeans
works: data.dwc:eventDate
works: data.dwc:eventID
works: data.dwc:eventRemarks
works: data.dwc:eventTime
works: data.dwc:family
works: data.dwc:fieldNotes
works: data.dwc:fieldNumber
works: data.dwc:footprintWKT
works: data.dwc:formation
works: data.dwc:genus
works: data.dwc:geodeticDatum
works: data.dwc:geologicalContextID
works: data.dwc:georeferenceProtocol
works: data.dwc:georeferenceRemarks
works: data.dwc:georeferenceSources
works: data.dwc:georeferenceVerificationStatus
works: data.dwc:georeferencedBy
works: data.dwc:georeferencedDate
works: data.dwc:group
works: data.dwc:habitat
works: data.dwc:higherClassification
works: data.dwc:higherGeography
works: data.dwc:higherGeographyID
works: data.dwc:highestBiostratigraphicZone
works: data.dwc:identificationID
works: data.dwc:identificationQualifier
works: data.dwc:identificationReferences
works: data.dwc:identificationRemarks
works: data.dwc:identificationVerificationStatus
works: data.dwc:identifiedBy
works: data.dwc:individualCount
works: data.dwc:individualID
works: data.dwc:informationWithheld
works: data.dwc:infraspecificEpithet
works: data.dwc:institutionCode
works: data.dwc:institutionID
works: data.dwc:island
works: data.dwc:islandGroup
works: data.dwc:kingdom
works: data.dwc:latestAgeOrHighestStage
works: data.dwc:latestEonOrHighestEonothem
works: data.dwc:latestEpochOrHighestSeries
works: data.dwc:latestEraOrHighestErathem
works: data.dwc:latestPeriodOrHighestSystem
works: data.dwc:lifeStage
works: data.dwc:lithostratigraphicTerms
works: data.dwc:locality
works: data.dwc:locationAccordingTo
works: data.dwc:locationID
works: data.dwc:locationRemarks
works: data.dwc:lowestBiostratigraphicZone
works: data.dwc:maximumDepthInMeters
works: data.dwc:maximumElevationInMeters
works: data.dwc:member
works: data.dwc:minimumDepthInMeters
works: data.dwc:minimumElevationInMeters
works: data.dwc:month
works: data.dwc:municipality
works: data.dwc:nameAccordingTo
works: data.dwc:nameAccordingToID
works: data.dwc:namePublishedIn
works: data.dwc:namePublishedInID
works: data.dwc:namePublishedInYear
works: data.dwc:nomenclaturalCode
works: data.dwc:nomenclaturalStatus
works: data.dwc:occurrenceDetails
works: data.dwc:occurrenceID
works: data.dwc:occurrenceRemarks
works: data.dwc:occurrenceStatus
works: data.dwc:order
works: data.dwc:organismID
works: data.dwc:originalNameUsage
works: data.dwc:otherCatalogNumbers
works: data.dwc:ownerInstitutionCode
works: data.dwc:parentNameUsage
works: data.dwc:phylum
works: data.dwc:preparations
works: data.dwc:previousIdentifications
works: data.dwc:recordNumber
works: data.dwc:recordedBy
works: data.dwc:reproductiveCondition
works: data.dwc:rights
works: data.dwc:rightsHolder
works: data.dwc:samplingEffort
works: data.dwc:samplingProtocol
works: data.dwc:scientificName
works: data.dwc:scientificNameAuthorship
works: data.dwc:scientificNameID
works: data.dwc:sex
works: data.dwc:specificEpithet
works: data.dwc:startDayOfYear
works: data.dwc:stateProvince
works: data.dwc:subgenus
works: data.dwc:taxonID
works: data.dwc:taxonRank
works: data.dwc:taxonRemarks
works: data.dwc:taxonomicStatus
works: data.dwc:typeStatus
works: data.dwc:verbatimCoordinateSystem
works: data.dwc:verbatimCoordinates
works: data.dwc:verbatimDepth
works: data.dwc:verbatimElevation
works: data.dwc:verbatimEventDate
works: data.dwc:verbatimLatitude
works: data.dwc:verbatimLocality
works: data.dwc:verbatimLongitude
works: data.dwc:verbatimSRS
works: data.dwc:verbatimTaxonRank
works: data.dwc:vernacularName
works: data.dwc:waterBody
works: data.dwc:year
works: data.fcc:datePicked
works: data.fcc:pickedBy
works: data.id
works: data.idigbio:preservative
works: data.idigbio:recordId
works: data.idigbio:subfamily
works: data.idigbio:substrate
works: data.idigbio:superfamily
works: data.symbiota:recordEnteredBy
works: data.symbiota:verbatimScientificName
works: datecollected
works: datemodified
works: dqs
works: earliestageorloweststage
works: earliesteonorlowesteonothem
works: earliestepochorlowestseries
works: earliesteraorlowesterathem
works: earliestperiodorlowestsystem
works: etag
works: eventdate
works: family
works: fieldnumber
does not work: flags
works: formation
works: genus
works: geologicalcontextid
works: geopoint
works: group
works: hasImage
works: hasMedia
works: highertaxon
works: highestbiostratigraphiczone
works: individualcount
works: infraspecificepithet
works: institutioncode
works: institutionid
works: institutionname
works: kingdom
works: latestageorhigheststage
works: latesteonorhighesteonothem
works: latestepochorhighestseries
works: latesteraorhighesterathem
works: latestperiodorhighestsystem
works: lithostratigraphicterms
works: locality
works: lowestbiostratigraphiczone
works: maxdepth
works: maxelevation
does not work: mediarecords
works: member
works: mindepth
works: minelevation
works: municipality
works: occurrenceid
works: order
works: phylum
does not work: recordids
works: recordnumber
works: recordset
works: scientificname
works: specificepithet
works: startdayofyear
works: stateprovince
works: taxonid
works: taxonomicstatus
works: taxonrank
works: typestatus
works: uuid
works: verbatimeventdate
works: verbatimlocality
works: version
works: waterbody

In [20]:
print(bad_field_set)


{'commonnames', 'flags', 'recordids', 'mediarecords'}

In [21]:
field_set -= bad_field_set
fields = ",".join(field_set)
df = (sqlContext.read.format("org.elasticsearch.spark.sql")
    .option("es.query", query)
    .option("es.read.field.include", fields)
    .option("es.nodes", nodes)
    .load("{0}/records".format(index))
)

In [22]:
df.printSchema()
print(df.count())
df.head(10)


root
 |-- barcodevalue: string (nullable = true)
 |-- basisofrecord: string (nullable = true)
 |-- bed: string (nullable = true)
 |-- canonicalname: string (nullable = true)
 |-- catalognumber: string (nullable = true)
 |-- class: string (nullable = true)
 |-- collectioncode: string (nullable = true)
 |-- collectionid: string (nullable = true)
 |-- collectionname: string (nullable = true)
 |-- collector: string (nullable = true)
 |-- commonname: string (nullable = true)
 |-- continent: string (nullable = true)
 |-- coordinateuncertainty: float (nullable = true)
 |-- country: string (nullable = true)
 |-- countrycode: string (nullable = true)
 |-- county: string (nullable = true)
 |-- data: struct (nullable = true)
 |    |-- coreid: string (nullable = true)
 |    |-- dc:rights: string (nullable = true)
 |    |-- dcterms:accessRights: string (nullable = true)
 |    |-- dcterms:bibliographicCitation: string (nullable = true)
 |    |-- dcterms:language: string (nullable = true)
 |    |-- dcterms:license: string (nullable = true)
 |    |-- dcterms:modified: string (nullable = true)
 |    |-- dcterms:references: string (nullable = true)
 |    |-- dcterms:rights: string (nullable = true)
 |    |-- dcterms:rightsHolder: string (nullable = true)
 |    |-- dcterms:source: string (nullable = true)
 |    |-- dcterms:type: string (nullable = true)
 |    |-- dwc:VerbatimEventDate: string (nullable = true)
 |    |-- dwc:acceptedNameUsage: string (nullable = true)
 |    |-- dwc:accessRights: string (nullable = true)
 |    |-- dwc:associatedMedia: string (nullable = true)
 |    |-- dwc:associatedOccurrences: string (nullable = true)
 |    |-- dwc:associatedReferences: string (nullable = true)
 |    |-- dwc:associatedSequences: string (nullable = true)
 |    |-- dwc:associatedTaxa: string (nullable = true)
 |    |-- dwc:basisOfRecord: string (nullable = true)
 |    |-- dwc:bed: string (nullable = true)
 |    |-- dwc:behavior: string (nullable = true)
 |    |-- dwc:catalogNumber: string (nullable = true)
 |    |-- dwc:class: string (nullable = true)
 |    |-- dwc:collectionCode: string (nullable = true)
 |    |-- dwc:collectionID: string (nullable = true)
 |    |-- dwc:continent: string (nullable = true)
 |    |-- dwc:coordinatePrecision: string (nullable = true)
 |    |-- dwc:coordinateUncertaintyInMeters: string (nullable = true)
 |    |-- dwc:country: string (nullable = true)
 |    |-- dwc:countryCode: string (nullable = true)
 |    |-- dwc:county: string (nullable = true)
 |    |-- dwc:dataGeneralizations: string (nullable = true)
 |    |-- dwc:datasetID: string (nullable = true)
 |    |-- dwc:datasetName: string (nullable = true)
 |    |-- dwc:dateIdentified: string (nullable = true)
 |    |-- dwc:day: string (nullable = true)
 |    |-- dwc:decimalLatitude: string (nullable = true)
 |    |-- dwc:decimalLongitude: string (nullable = true)
 |    |-- dwc:disposition: string (nullable = true)
 |    |-- dwc:dynamicProperties: string (nullable = true)
 |    |-- dwc:earliestAgeOrLowestStage: string (nullable = true)
 |    |-- dwc:earliestEonOrLowestEonothem: string (nullable = true)
 |    |-- dwc:earliestEpochOrLowestSeries: string (nullable = true)
 |    |-- dwc:earliestEraOrLowestErathem: string (nullable = true)
 |    |-- dwc:earliestPeriodOrLowestSystem: string (nullable = true)
 |    |-- dwc:endDayOfYear: string (nullable = true)
 |    |-- dwc:establishmentMeans: string (nullable = true)
 |    |-- dwc:eventDate: string (nullable = true)
 |    |-- dwc:eventID: string (nullable = true)
 |    |-- dwc:eventRemarks: string (nullable = true)
 |    |-- dwc:eventTime: string (nullable = true)
 |    |-- dwc:family: string (nullable = true)
 |    |-- dwc:fieldNotes: string (nullable = true)
 |    |-- dwc:fieldNumber: string (nullable = true)
 |    |-- dwc:footprintWKT: string (nullable = true)
 |    |-- dwc:formation: string (nullable = true)
 |    |-- dwc:genus: string (nullable = true)
 |    |-- dwc:geodeticDatum: string (nullable = true)
 |    |-- dwc:geologicalContextID: string (nullable = true)
 |    |-- dwc:georeferenceProtocol: string (nullable = true)
 |    |-- dwc:georeferenceRemarks: string (nullable = true)
 |    |-- dwc:georeferenceSources: string (nullable = true)
 |    |-- dwc:georeferenceVerificationStatus: string (nullable = true)
 |    |-- dwc:georeferencedBy: string (nullable = true)
 |    |-- dwc:georeferencedDate: string (nullable = true)
 |    |-- dwc:group: string (nullable = true)
 |    |-- dwc:habitat: string (nullable = true)
 |    |-- dwc:higherClassification: string (nullable = true)
 |    |-- dwc:higherGeography: string (nullable = true)
 |    |-- dwc:higherGeographyID: string (nullable = true)
 |    |-- dwc:highestBiostratigraphicZone: string (nullable = true)
 |    |-- dwc:identificationID: string (nullable = true)
 |    |-- dwc:identificationQualifier: string (nullable = true)
 |    |-- dwc:identificationReferences: string (nullable = true)
 |    |-- dwc:identificationRemarks: string (nullable = true)
 |    |-- dwc:identificationVerificationStatus: string (nullable = true)
 |    |-- dwc:identifiedBy: string (nullable = true)
 |    |-- dwc:individualCount: string (nullable = true)
 |    |-- dwc:individualID: string (nullable = true)
 |    |-- dwc:informationWithheld: string (nullable = true)
 |    |-- dwc:infraspecificEpithet: string (nullable = true)
 |    |-- dwc:institutionCode: string (nullable = true)
 |    |-- dwc:institutionID: string (nullable = true)
 |    |-- dwc:island: string (nullable = true)
 |    |-- dwc:islandGroup: string (nullable = true)
 |    |-- dwc:kingdom: string (nullable = true)
 |    |-- dwc:latestAgeOrHighestStage: string (nullable = true)
 |    |-- dwc:latestEonOrHighestEonothem: string (nullable = true)
 |    |-- dwc:latestEpochOrHighestSeries: string (nullable = true)
 |    |-- dwc:latestEraOrHighestErathem: string (nullable = true)
 |    |-- dwc:latestPeriodOrHighestSystem: string (nullable = true)
 |    |-- dwc:lifeStage: string (nullable = true)
 |    |-- dwc:lithostratigraphicTerms: string (nullable = true)
 |    |-- dwc:locality: string (nullable = true)
 |    |-- dwc:locationAccordingTo: string (nullable = true)
 |    |-- dwc:locationID: string (nullable = true)
 |    |-- dwc:locationRemarks: string (nullable = true)
 |    |-- dwc:lowestBiostratigraphicZone: string (nullable = true)
 |    |-- dwc:maximumDepthInMeters: string (nullable = true)
 |    |-- dwc:maximumElevationInMeters: string (nullable = true)
 |    |-- dwc:member: string (nullable = true)
 |    |-- dwc:minimumDepthInMeters: string (nullable = true)
 |    |-- dwc:minimumElevationInMeters: string (nullable = true)
 |    |-- dwc:month: string (nullable = true)
 |    |-- dwc:municipality: string (nullable = true)
 |    |-- dwc:nameAccordingTo: string (nullable = true)
 |    |-- dwc:nameAccordingToID: string (nullable = true)
 |    |-- dwc:namePublishedIn: string (nullable = true)
 |    |-- dwc:namePublishedInID: string (nullable = true)
 |    |-- dwc:namePublishedInYear: string (nullable = true)
 |    |-- dwc:nomenclaturalCode: string (nullable = true)
 |    |-- dwc:nomenclaturalStatus: string (nullable = true)
 |    |-- dwc:occurrenceDetails: string (nullable = true)
 |    |-- dwc:occurrenceID: string (nullable = true)
 |    |-- dwc:occurrenceRemarks: string (nullable = true)
 |    |-- dwc:occurrenceStatus: string (nullable = true)
 |    |-- dwc:order: string (nullable = true)
 |    |-- dwc:organismID: string (nullable = true)
 |    |-- dwc:originalNameUsage: string (nullable = true)
 |    |-- dwc:otherCatalogNumbers: string (nullable = true)
 |    |-- dwc:ownerInstitutionCode: string (nullable = true)
 |    |-- dwc:parentNameUsage: string (nullable = true)
 |    |-- dwc:phylum: string (nullable = true)
 |    |-- dwc:preparations: string (nullable = true)
 |    |-- dwc:previousIdentifications: string (nullable = true)
 |    |-- dwc:recordNumber: string (nullable = true)
 |    |-- dwc:recordedBy: string (nullable = true)
 |    |-- dwc:reproductiveCondition: string (nullable = true)
 |    |-- dwc:rights: string (nullable = true)
 |    |-- dwc:rightsHolder: string (nullable = true)
 |    |-- dwc:samplingEffort: string (nullable = true)
 |    |-- dwc:samplingProtocol: string (nullable = true)
 |    |-- dwc:scientificName: string (nullable = true)
 |    |-- dwc:scientificNameAuthorship: string (nullable = true)
 |    |-- dwc:scientificNameID: string (nullable = true)
 |    |-- dwc:sex: string (nullable = true)
 |    |-- dwc:specificEpithet: string (nullable = true)
 |    |-- dwc:startDayOfYear: string (nullable = true)
 |    |-- dwc:stateProvince: string (nullable = true)
 |    |-- dwc:subgenus: string (nullable = true)
 |    |-- dwc:taxonID: string (nullable = true)
 |    |-- dwc:taxonRank: string (nullable = true)
 |    |-- dwc:taxonRemarks: string (nullable = true)
 |    |-- dwc:taxonomicStatus: string (nullable = true)
 |    |-- dwc:typeStatus: string (nullable = true)
 |    |-- dwc:verbatimCoordinateSystem: string (nullable = true)
 |    |-- dwc:verbatimCoordinates: string (nullable = true)
 |    |-- dwc:verbatimDepth: string (nullable = true)
 |    |-- dwc:verbatimElevation: string (nullable = true)
 |    |-- dwc:verbatimEventDate: string (nullable = true)
 |    |-- dwc:verbatimLatitude: string (nullable = true)
 |    |-- dwc:verbatimLocality: string (nullable = true)
 |    |-- dwc:verbatimLongitude: string (nullable = true)
 |    |-- dwc:verbatimSRS: string (nullable = true)
 |    |-- dwc:verbatimTaxonRank: string (nullable = true)
 |    |-- dwc:vernacularName: string (nullable = true)
 |    |-- dwc:waterBody: string (nullable = true)
 |    |-- dwc:year: string (nullable = true)
 |    |-- fcc:datePicked: string (nullable = true)
 |    |-- fcc:pickedBy: string (nullable = true)
 |    |-- id: string (nullable = true)
 |    |-- idigbio:preservative: string (nullable = true)
 |    |-- idigbio:recordId: string (nullable = true)
 |    |-- idigbio:subfamily: string (nullable = true)
 |    |-- idigbio:substrate: string (nullable = true)
 |    |-- idigbio:superfamily: string (nullable = true)
 |    |-- symbiota:recordEnteredBy: string (nullable = true)
 |    |-- symbiota:verbatimScientificName: string (nullable = true)
 |-- datecollected: timestamp (nullable = true)
 |-- datemodified: timestamp (nullable = true)
 |-- dqs: float (nullable = true)
 |-- earliestageorloweststage: string (nullable = true)
 |-- earliesteonorlowesteonothem: string (nullable = true)
 |-- earliestepochorlowestseries: string (nullable = true)
 |-- earliesteraorlowesterathem: string (nullable = true)
 |-- earliestperiodorlowestsystem: string (nullable = true)
 |-- etag: string (nullable = true)
 |-- eventdate: string (nullable = true)
 |-- family: string (nullable = true)
 |-- fieldnumber: string (nullable = true)
 |-- formation: string (nullable = true)
 |-- genus: string (nullable = true)
 |-- geologicalcontextid: string (nullable = true)
 |-- geopoint: struct (nullable = true)
 |    |-- lat: double (nullable = true)
 |    |-- lon: double (nullable = true)
 |-- group: string (nullable = true)
 |-- hasImage: boolean (nullable = true)
 |-- hasMedia: boolean (nullable = true)
 |-- highertaxon: string (nullable = true)
 |-- highestbiostratigraphiczone: string (nullable = true)
 |-- individualcount: float (nullable = true)
 |-- infraspecificepithet: string (nullable = true)
 |-- institutioncode: string (nullable = true)
 |-- institutionid: string (nullable = true)
 |-- institutionname: string (nullable = true)
 |-- kingdom: string (nullable = true)
 |-- latestageorhigheststage: string (nullable = true)
 |-- latesteonorhighesteonothem: string (nullable = true)
 |-- latestepochorhighestseries: string (nullable = true)
 |-- latesteraorhighesterathem: string (nullable = true)
 |-- latestperiodorhighestsystem: string (nullable = true)
 |-- lithostratigraphicterms: string (nullable = true)
 |-- locality: string (nullable = true)
 |-- lowestbiostratigraphiczone: string (nullable = true)
 |-- maxdepth: float (nullable = true)
 |-- maxelevation: float (nullable = true)
 |-- member: string (nullable = true)
 |-- mindepth: float (nullable = true)
 |-- minelevation: float (nullable = true)
 |-- municipality: string (nullable = true)
 |-- occurrenceid: string (nullable = true)
 |-- order: string (nullable = true)
 |-- phylum: string (nullable = true)
 |-- recordnumber: string (nullable = true)
 |-- recordset: string (nullable = true)
 |-- scientificname: string (nullable = true)
 |-- specificepithet: string (nullable = true)
 |-- startdayofyear: integer (nullable = true)
 |-- stateprovince: string (nullable = true)
 |-- taxonid: string (nullable = true)
 |-- taxonomicstatus: string (nullable = true)
 |-- taxonrank: string (nullable = true)
 |-- typestatus: string (nullable = true)
 |-- uuid: string (nullable = true)
 |-- verbatimeventdate: string (nullable = true)
 |-- verbatimlocality: string (nullable = true)
 |-- version: integer (nullable = true)
 |-- waterbody: string (nullable = true)

447
Out[22]:
[Row(barcodevalue=None, basisofrecord='preservedspecimen', bed=None, canonicalname='acer dubium', catalognumber='1730298', class='magnoliopsida', collectioncode='botany', collectionid=None, collectionname=None, collector='w. r. adams', commonname=None, continent='north america', coordinateuncertainty=None, country='united states', countrycode='usa', county='chittenden county', data=Row(coreid=None, dc:rights=None, dcterms:accessRights=None, dcterms:bibliographicCitation=None, dcterms:language=None, dcterms:license=None, dcterms:modified=None, dcterms:references=None, dcterms:rights='https://creativecommons.org/publicdomain/zero/1.0/', dcterms:rightsHolder=None, dcterms:source=None, dcterms:type='PhysicalObject', dwc:VerbatimEventDate=None, dwc:acceptedNameUsage=None, dwc:accessRights=None, dwc:associatedMedia=None, dwc:associatedOccurrences=None, dwc:associatedReferences=None, dwc:associatedSequences=None, dwc:associatedTaxa=None, dwc:basisOfRecord='PreservedSpecimen', dwc:bed=None, dwc:behavior=None, dwc:catalogNumber='1730298', dwc:class='Dicotyledonae', dwc:collectionCode='Botany', dwc:collectionID=None, dwc:continent='North America', dwc:coordinatePrecision=None, dwc:coordinateUncertaintyInMeters=None, dwc:country='United States', dwc:countryCode=None, dwc:county='Chittenden County', dwc:dataGeneralizations=None, dwc:datasetID=None, dwc:datasetName=None, dwc:dateIdentified=None, dwc:day='10', dwc:decimalLatitude=None, dwc:decimalLongitude=None, dwc:disposition=None, dwc:dynamicProperties=None, dwc:earliestAgeOrLowestStage=None, dwc:earliestEonOrLowestEonothem=None, dwc:earliestEpochOrLowestSeries=None, dwc:earliestEraOrLowestErathem=None, dwc:earliestPeriodOrLowestSystem=None, dwc:endDayOfYear='284', dwc:establishmentMeans=None, dwc:eventDate=None, dwc:eventID=None, dwc:eventRemarks=None, dwc:eventTime=None, dwc:family='Aceraceae', dwc:fieldNotes=None, dwc:fieldNumber=None, dwc:footprintWKT=None, dwc:formation=None, dwc:genus='Acer', dwc:geodeticDatum=None, dwc:geologicalContextID=None, dwc:georeferenceProtocol=None, dwc:georeferenceRemarks=None, dwc:georeferenceSources=None, dwc:georeferenceVerificationStatus=None, dwc:georeferencedBy=None, dwc:georeferencedDate=None, dwc:group=None, dwc:habitat='Well drained sandy soil', dwc:higherClassification='Plantae, Dicotyledonae, Sapindales, Aceraceae', dwc:higherGeography='North America, United States, Vermont, Chittenden County', dwc:higherGeographyID=None, dwc:highestBiostratigraphicZone=None, dwc:identificationID=None, dwc:identificationQualifier=None, dwc:identificationReferences=None, dwc:identificationRemarks=None, dwc:identificationVerificationStatus=None, dwc:identifiedBy='Ellis, W. H.', dwc:individualCount='1', dwc:individualID=None, dwc:informationWithheld=None, dwc:infraspecificEpithet=None, dwc:institutionCode='US', dwc:institutionID=None, dwc:island=None, dwc:islandGroup=None, dwc:kingdom='Plantae', dwc:latestAgeOrHighestStage=None, dwc:latestEonOrHighestEonothem=None, dwc:latestEpochOrHighestSeries=None, dwc:latestEraOrHighestErathem=None, dwc:latestPeriodOrHighestSystem=None, dwc:lifeStage='Flowering', dwc:lithostratigraphicTerms=None, dwc:locality='Burlington', dwc:locationAccordingTo=None, dwc:locationID=None, dwc:locationRemarks=None, dwc:lowestBiostratigraphicZone=None, dwc:maximumDepthInMeters=None, dwc:maximumElevationInMeters=None, dwc:member=None, dwc:minimumDepthInMeters=None, dwc:minimumElevationInMeters=None, dwc:month='10', dwc:municipality=None, dwc:nameAccordingTo=None, dwc:nameAccordingToID=None, dwc:namePublishedIn=None, dwc:namePublishedInID=None, dwc:namePublishedInYear=None, dwc:nomenclaturalCode=None, dwc:nomenclaturalStatus=None, dwc:occurrenceDetails=None, dwc:occurrenceID='http://n2t.net/ark:/65665/31b0dc309-c955-488e-85bb-702b128bedaa', dwc:occurrenceRemarks=None, dwc:occurrenceStatus=None, dwc:order='Sapindales', dwc:organismID=None, dwc:originalNameUsage=None, dwc:otherCatalogNumbers=None, dwc:ownerInstitutionCode=None, dwc:parentNameUsage=None, dwc:phylum=None, dwc:preparations=None, dwc:previousIdentifications=None, dwc:recordNumber='8277', dwc:recordedBy='W. R. Adams', dwc:reproductiveCondition=None, dwc:rights=None, dwc:rightsHolder=None, dwc:samplingEffort=None, dwc:samplingProtocol=None, dwc:scientificName='Acer rubrum', dwc:scientificNameAuthorship='L.', dwc:scientificNameID=None, dwc:sex=None, dwc:specificEpithet='rubrum', dwc:startDayOfYear='284', dwc:stateProvince='Vermont', dwc:subgenus=None, dwc:taxonID=None, dwc:taxonRank=None, dwc:taxonRemarks=None, dwc:taxonomicStatus=None, dwc:typeStatus=None, dwc:verbatimCoordinateSystem=None, dwc:verbatimCoordinates=None, dwc:verbatimDepth=None, dwc:verbatimElevation=None, dwc:verbatimEventDate=None, dwc:verbatimLatitude=None, dwc:verbatimLocality=None, dwc:verbatimLongitude=None, dwc:verbatimSRS=None, dwc:verbatimTaxonRank=None, dwc:vernacularName=None, dwc:waterBody=None, dwc:year='1936', fcc:datePicked=None, fcc:pickedBy=None, id='http://n2t.net/ark:/65665/31b0dc309-c955-488e-85bb-702b128bedaa', idigbio:preservative=None, idigbio:recordId=None, idigbio:subfamily=None, idigbio:substrate=None, idigbio:superfamily=None, symbiota:recordEnteredBy=None, symbiota:verbatimScientificName=None), datecollected=datetime.datetime(1936, 10, 10, 0, 0), datemodified=datetime.datetime(2016, 9, 22, 10, 42, 32, 961000), dqs=0.20895522832870483, earliestageorloweststage=None, earliesteonorlowesteonothem=None, earliestepochorlowestseries=None, earliesteraorlowesterathem=None, earliestperiodorlowestsystem=None, etag='fa592a64674aab0fb00db6bf5903a1420d96e602', eventdate=None, family='sapindaceae', fieldnumber=None, formation=None, genus='acer', geologicalcontextid=None, geopoint=None, group=None, hasImage=False, hasMedia=False, highertaxon='plantae, dicotyledonae, sapindales, aceraceae', highestbiostratigraphiczone=None, individualcount=1.0, infraspecificepithet=None, institutioncode='us', institutionid=None, institutionname=None, kingdom='plantae', latestageorhigheststage=None, latesteonorhighesteonothem=None, latestepochorhighestseries=None, latesteraorhighesterathem=None, latestperiodorhighestsystem=None, lithostratigraphicterms=None, locality='burlington', lowestbiostratigraphiczone=None, maxdepth=None, maxelevation=None, member=None, mindepth=None, minelevation=None, municipality=None, occurrenceid='http://n2t.net/ark:/65665/31b0dc309-c955-488e-85bb-702b128bedaa', order='sapindales', phylum='tracheophyta', recordnumber='8277', recordset='a6eee223-cf3b-4079-8bb2-b77dad8cae9d', scientificname='acer rubrum', specificepithet='rubrum', startdayofyear=284, stateprovince='vermont', taxonid='4924460', taxonomicstatus='accepted', taxonrank='species', typestatus=None, uuid='1e7d0cef-515f-435a-95d9-0511d31a7aaf', verbatimeventdate=None, verbatimlocality=None, version=None, waterbody=None),
 Row(barcodevalue=None, basisofrecord='preservedspecimen', bed=None, canonicalname='acer pensylvanicum l.', catalognumber='conn00078708', class='magnoliopsida', collectioncode='conn', collectionid=None, collectionname=None, collector='w. w. eggleston', commonname='moosewood; snake-bark maple; striped maple', continent='north america', coordinateuncertainty=20000.0, country='united states', countrycode='usa', county='rutland county', data=Row(coreid=None, dc:rights=None, dcterms:accessRights=None, dcterms:bibliographicCitation=None, dcterms:language=None, dcterms:license=None, dcterms:modified='2009-05-21T00:00-0500', dcterms:references=None, dcterms:rights='This work is licensed under a Creative Commons CCZero 1.0 License http://i.creativecommons.org/l/by-nc-sa/4.0/88x31.png', dcterms:rightsHolder=None, dcterms:source=None, dcterms:type=None, dwc:VerbatimEventDate=None, dwc:acceptedNameUsage=None, dwc:accessRights=None, dwc:associatedMedia=None, dwc:associatedOccurrences=None, dwc:associatedReferences=None, dwc:associatedSequences=None, dwc:associatedTaxa=None, dwc:basisOfRecord='Preserved Specimen', dwc:bed=None, dwc:behavior=None, dwc:catalogNumber='CONN00078708', dwc:class=None, dwc:collectionCode='CONN', dwc:collectionID=None, dwc:continent=None, dwc:coordinatePrecision=None, dwc:coordinateUncertaintyInMeters='20000', dwc:country='USA', dwc:countryCode='US', dwc:county='Rutland County', dwc:dataGeneralizations=None, dwc:datasetID='68732', dwc:datasetName=None, dwc:dateIdentified=None, dwc:day='16', dwc:decimalLatitude='43.60444', dwc:decimalLongitude='-72.82055', dwc:disposition=None, dwc:dynamicProperties=None, dwc:earliestAgeOrLowestStage=None, dwc:earliestEonOrLowestEonothem=None, dwc:earliestEpochOrLowestSeries=None, dwc:earliestEraOrLowestErathem=None, dwc:earliestPeriodOrLowestSystem=None, dwc:endDayOfYear=None, dwc:establishmentMeans=None, dwc:eventDate='1897-05-16', dwc:eventID=None, dwc:eventRemarks=None, dwc:eventTime=None, dwc:family='Aceraceae', dwc:fieldNotes=None, dwc:fieldNumber=None, dwc:footprintWKT=None, dwc:formation=None, dwc:genus='Acer', dwc:geodeticDatum=None, dwc:geologicalContextID=None, dwc:georeferenceProtocol=None, dwc:georeferenceRemarks=None, dwc:georeferenceSources=None, dwc:georeferenceVerificationStatus=None, dwc:georeferencedBy=None, dwc:georeferencedDate=None, dwc:group=None, dwc:habitat=None, dwc:higherClassification='Plantae; Dicotyledonae; Sapindales; Aceraceae', dwc:higherGeography='USA; Vermont; Rutland County; Mendon', dwc:higherGeographyID=None, dwc:highestBiostratigraphicZone=None, dwc:identificationID=None, dwc:identificationQualifier=None, dwc:identificationReferences=None, dwc:identificationRemarks=None, dwc:identificationVerificationStatus=None, dwc:identifiedBy=None, dwc:individualCount=None, dwc:individualID=None, dwc:informationWithheld=None, dwc:infraspecificEpithet=None, dwc:institutionCode='UConn', dwc:institutionID=None, dwc:island=None, dwc:islandGroup=None, dwc:kingdom='Dicotyledonae', dwc:latestAgeOrHighestStage=None, dwc:latestEonOrHighestEonothem=None, dwc:latestEpochOrHighestSeries=None, dwc:latestEraOrHighestErathem=None, dwc:latestPeriodOrHighestSystem=None, dwc:lifeStage=None, dwc:lithostratigraphicTerms=None, dwc:locality='Mendon', dwc:locationAccordingTo=None, dwc:locationID=None, dwc:locationRemarks=None, dwc:lowestBiostratigraphicZone=None, dwc:maximumDepthInMeters=None, dwc:maximumElevationInMeters=None, dwc:member=None, dwc:minimumDepthInMeters=None, dwc:minimumElevationInMeters=None, dwc:month='5', dwc:municipality='Mendon', dwc:nameAccordingTo=None, dwc:nameAccordingToID=None, dwc:namePublishedIn=None, dwc:namePublishedInID=None, dwc:namePublishedInYear=None, dwc:nomenclaturalCode=None, dwc:nomenclaturalStatus=None, dwc:occurrenceDetails=None, dwc:occurrenceID='urn:catalog:UConn:CONN:CONN00078708', dwc:occurrenceRemarks='pistillate flowers, stamminate flowers', dwc:occurrenceStatus=None, dwc:order='Sapindales', dwc:organismID=None, dwc:originalNameUsage=None, dwc:otherCatalogNumbers=None, dwc:ownerInstitutionCode=None, dwc:parentNameUsage=None, dwc:phylum=None, dwc:preparations=None, dwc:previousIdentifications='Acer pensylvanicum L.', dwc:recordNumber=None, dwc:recordedBy='W. W. Eggleston', dwc:reproductiveCondition='fruiting', dwc:rights=None, dwc:rightsHolder=None, dwc:samplingEffort=None, dwc:samplingProtocol=None, dwc:scientificName='Acer pensylvanicum L.', dwc:scientificNameAuthorship=None, dwc:scientificNameID=None, dwc:sex=None, dwc:specificEpithet='pensylvanicum', dwc:startDayOfYear=None, dwc:stateProvince='Vermont', dwc:subgenus=None, dwc:taxonID=None, dwc:taxonRank=None, dwc:taxonRemarks=None, dwc:taxonomicStatus=None, dwc:typeStatus=None, dwc:verbatimCoordinateSystem=None, dwc:verbatimCoordinates=None, dwc:verbatimDepth=None, dwc:verbatimElevation=None, dwc:verbatimEventDate='16 May 1897', dwc:verbatimLatitude='43°36\' 16" N', dwc:verbatimLocality=None, dwc:verbatimLongitude='72°49\' 14" W', dwc:verbatimSRS=None, dwc:verbatimTaxonRank=None, dwc:vernacularName='Moosewood; Snake-Bark Maple; Striped Maple', dwc:waterBody=None, dwc:year='1897', fcc:datePicked=None, fcc:pickedBy=None, id=None, idigbio:preservative=None, idigbio:recordId=None, idigbio:subfamily=None, idigbio:substrate=None, idigbio:superfamily=None, symbiota:recordEnteredBy=None, symbiota:verbatimScientificName=None), datecollected=datetime.datetime(1897, 5, 15, 19, 0), datemodified=datetime.datetime(2014, 9, 12, 15, 10, 56, 798000), dqs=0.2238806039094925, earliestageorloweststage=None, earliesteonorlowesteonothem=None, earliestepochorlowestseries=None, earliesteraorlowesterathem=None, earliestperiodorlowestsystem=None, etag='f146b6242c77076d6b42bef3bf576ea91243033c', eventdate='1897-05-16', family='sapindaceae', fieldnumber=None, formation=None, genus='acer', geologicalcontextid=None, geopoint=Row(lat=43.60444, lon=-72.82055), group=None, hasImage=True, hasMedia=True, highertaxon='plantae; dicotyledonae; sapindales; aceraceae', highestbiostratigraphiczone=None, individualcount=None, infraspecificepithet=None, institutioncode='uconn', institutionid=None, institutionname=None, kingdom='plantae', latestageorhigheststage=None, latesteonorhighesteonothem=None, latestepochorhighestseries=None, latesteraorhighesterathem=None, latestperiodorhighestsystem=None, lithostratigraphicterms=None, locality='mendon', lowestbiostratigraphiczone=None, maxdepth=None, maxelevation=None, member=None, mindepth=None, minelevation=None, municipality='mendon', occurrenceid='urn:catalog:uconn:conn:conn00078708', order='sapindales', phylum='tracheophyta', recordnumber=None, recordset='e70af26a-fb9e-43ab-96a0-d62a2df37e6d', scientificname='acer pensylvanicum l.', specificepithet='pensylvanicum', startdayofyear=136, stateprovince='vermont', taxonid='3189836', taxonomicstatus='accepted', taxonrank='species', typestatus=None, uuid='15b6921e-340d-4216-85b8-13f2207d22d1', verbatimeventdate='16 may 1897', verbatimlocality=None, version=None, waterbody=None),
 Row(barcodevalue=None, basisofrecord='preservedspecimen', bed=None, canonicalname='acer pensylvanicum l.', catalognumber='17959', class='magnoliopsida', collectioncode='botany', collectionid=None, collectionname=None, collector='c. g. pringle', commonname=None, continent='north america', coordinateuncertainty=None, country='united states', countrycode='usa', county=None, data=Row(coreid=None, dc:rights=None, dcterms:accessRights=None, dcterms:bibliographicCitation=None, dcterms:language=None, dcterms:license=None, dcterms:modified=None, dcterms:references=None, dcterms:rights='https://creativecommons.org/publicdomain/zero/1.0/', dcterms:rightsHolder=None, dcterms:source=None, dcterms:type='PhysicalObject', dwc:VerbatimEventDate=None, dwc:acceptedNameUsage=None, dwc:accessRights=None, dwc:associatedMedia=None, dwc:associatedOccurrences=None, dwc:associatedReferences=None, dwc:associatedSequences=None, dwc:associatedTaxa=None, dwc:basisOfRecord='PreservedSpecimen', dwc:bed=None, dwc:behavior=None, dwc:catalogNumber='17959', dwc:class='Dicotyledonae', dwc:collectionCode='Botany', dwc:collectionID=None, dwc:continent='North America', dwc:coordinatePrecision=None, dwc:coordinateUncertaintyInMeters=None, dwc:country='United States', dwc:countryCode=None, dwc:county=None, dwc:dataGeneralizations=None, dwc:datasetID=None, dwc:datasetName=None, dwc:dateIdentified=None, dwc:day='8', dwc:decimalLatitude=None, dwc:decimalLongitude=None, dwc:disposition=None, dwc:dynamicProperties=None, dwc:earliestAgeOrLowestStage=None, dwc:earliestEonOrLowestEonothem=None, dwc:earliestEpochOrLowestSeries=None, dwc:earliestEraOrLowestErathem=None, dwc:earliestPeriodOrLowestSystem=None, dwc:endDayOfYear='159', dwc:establishmentMeans=None, dwc:eventDate=None, dwc:eventID=None, dwc:eventRemarks=None, dwc:eventTime=None, dwc:family='Aceraceae', dwc:fieldNotes=None, dwc:fieldNumber=None, dwc:footprintWKT=None, dwc:formation=None, dwc:genus='Acer', dwc:geodeticDatum=None, dwc:geologicalContextID=None, dwc:georeferenceProtocol=None, dwc:georeferenceRemarks=None, dwc:georeferenceSources=None, dwc:georeferenceVerificationStatus=None, dwc:georeferencedBy=None, dwc:georeferencedDate=None, dwc:group=None, dwc:habitat='Mountain woods', dwc:higherClassification='Plantae, Dicotyledonae, Sapindales, Aceraceae', dwc:higherGeography='North America, United States, Vermont', dwc:higherGeographyID=None, dwc:highestBiostratigraphicZone=None, dwc:identificationID=None, dwc:identificationQualifier=None, dwc:identificationReferences=None, dwc:identificationRemarks=None, dwc:identificationVerificationStatus=None, dwc:identifiedBy=None, dwc:individualCount='1', dwc:individualID=None, dwc:informationWithheld=None, dwc:infraspecificEpithet=None, dwc:institutionCode='US', dwc:institutionID=None, dwc:island=None, dwc:islandGroup=None, dwc:kingdom='Plantae', dwc:latestAgeOrHighestStage=None, dwc:latestEonOrHighestEonothem=None, dwc:latestEpochOrHighestSeries=None, dwc:latestEraOrHighestErathem=None, dwc:latestPeriodOrHighestSystem=None, dwc:lifeStage='Fruiting', dwc:lithostratigraphicTerms=None, dwc:locality=None, dwc:locationAccordingTo=None, dwc:locationID=None, dwc:locationRemarks=None, dwc:lowestBiostratigraphicZone=None, dwc:maximumDepthInMeters=None, dwc:maximumElevationInMeters=None, dwc:member=None, dwc:minimumDepthInMeters=None, dwc:minimumElevationInMeters=None, dwc:month='6', dwc:municipality=None, dwc:nameAccordingTo=None, dwc:nameAccordingToID=None, dwc:namePublishedIn=None, dwc:namePublishedInID=None, dwc:namePublishedInYear=None, dwc:nomenclaturalCode=None, dwc:nomenclaturalStatus=None, dwc:occurrenceDetails=None, dwc:occurrenceID='http://n2t.net/ark:/65665/3ca016bc8-3c19-4166-8c0f-5f360a64d262', dwc:occurrenceRemarks=None, dwc:occurrenceStatus=None, dwc:order='Sapindales', dwc:organismID=None, dwc:originalNameUsage=None, dwc:otherCatalogNumbers=None, dwc:ownerInstitutionCode=None, dwc:parentNameUsage=None, dwc:phylum=None, dwc:preparations=None, dwc:previousIdentifications=None, dwc:recordNumber='s.n.', dwc:recordedBy='C. G. Pringle', dwc:reproductiveCondition=None, dwc:rights=None, dwc:rightsHolder=None, dwc:samplingEffort=None, dwc:samplingProtocol=None, dwc:scientificName='Acer pensylvanicum', dwc:scientificNameAuthorship='L.', dwc:scientificNameID=None, dwc:sex=None, dwc:specificEpithet='pensylvanicum', dwc:startDayOfYear='159', dwc:stateProvince='Vermont', dwc:subgenus=None, dwc:taxonID=None, dwc:taxonRank=None, dwc:taxonRemarks=None, dwc:taxonomicStatus=None, dwc:typeStatus=None, dwc:verbatimCoordinateSystem=None, dwc:verbatimCoordinates=None, dwc:verbatimDepth=None, dwc:verbatimElevation=None, dwc:verbatimEventDate='fr [?] October', dwc:verbatimLatitude=None, dwc:verbatimLocality=None, dwc:verbatimLongitude=None, dwc:verbatimSRS=None, dwc:verbatimTaxonRank=None, dwc:vernacularName=None, dwc:waterBody=None, dwc:year='1877', fcc:datePicked=None, fcc:pickedBy=None, id='http://n2t.net/ark:/65665/3ca016bc8-3c19-4166-8c0f-5f360a64d262', idigbio:preservative=None, idigbio:recordId=None, idigbio:subfamily=None, idigbio:substrate=None, idigbio:superfamily=None, symbiota:recordEnteredBy=None, symbiota:verbatimScientificName=None), datecollected=datetime.datetime(1877, 6, 8, 0, 0), datemodified=datetime.datetime(2016, 9, 22, 10, 42, 32, 961000), dqs=0.19402985274791718, earliestageorloweststage=None, earliesteonorlowesteonothem=None, earliestepochorlowestseries=None, earliesteraorlowesterathem=None, earliestperiodorlowestsystem=None, etag='4c8a89d61259980b32f109c4f660edf3f2f05b06', eventdate=None, family='sapindaceae', fieldnumber=None, formation=None, genus='acer', geologicalcontextid=None, geopoint=None, group=None, hasImage=False, hasMedia=False, highertaxon='plantae, dicotyledonae, sapindales, aceraceae', highestbiostratigraphiczone=None, individualcount=1.0, infraspecificepithet=None, institutioncode='us', institutionid=None, institutionname=None, kingdom='plantae', latestageorhigheststage=None, latesteonorhighesteonothem=None, latestepochorhighestseries=None, latesteraorhighesterathem=None, latestperiodorhighestsystem=None, lithostratigraphicterms=None, locality=None, lowestbiostratigraphiczone=None, maxdepth=None, maxelevation=None, member=None, mindepth=None, minelevation=None, municipality=None, occurrenceid='http://n2t.net/ark:/65665/3ca016bc8-3c19-4166-8c0f-5f360a64d262', order='sapindales', phylum='tracheophyta', recordnumber='s.n.', recordset='a6eee223-cf3b-4079-8bb2-b77dad8cae9d', scientificname='acer pensylvanicum', specificepithet='pensylvanicum', startdayofyear=159, stateprovince='vermont', taxonid='3189836', taxonomicstatus='accepted', taxonrank='species', typestatus=None, uuid='03507aa9-f926-4513-a980-8071dbc69fc1', verbatimeventdate='fr [?] october', verbatimlocality=None, version=None, waterbody=None),
 Row(barcodevalue=None, basisofrecord='preservedspecimen', bed=None, canonicalname='acer pensylvanicum l.', catalognumber='conn00078687', class='magnoliopsida', collectioncode='conn', collectionid=None, collectionname=None, collector='"g.s. torrey, g. mehlquist & a.f. hill"', commonname='moosewood; snake-bark maple; striped maple', continent='north america', coordinateuncertainty=20000.0, country='united states', countrycode='usa', county='lamoille county', data=Row(coreid=None, dc:rights=None, dcterms:accessRights=None, dcterms:bibliographicCitation=None, dcterms:language=None, dcterms:license=None, dcterms:modified='2012-04-06T00:00-0500', dcterms:references=None, dcterms:rights='This work is licensed under a Creative Commons CCZero 1.0 License http://i.creativecommons.org/l/by-nc-sa/4.0/88x31.png', dcterms:rightsHolder=None, dcterms:source=None, dcterms:type=None, dwc:VerbatimEventDate=None, dwc:acceptedNameUsage=None, dwc:accessRights=None, dwc:associatedMedia=None, dwc:associatedOccurrences=None, dwc:associatedReferences=None, dwc:associatedSequences=None, dwc:associatedTaxa=None, dwc:basisOfRecord='Preserved Specimen', dwc:bed=None, dwc:behavior=None, dwc:catalogNumber='CONN00078687', dwc:class=None, dwc:collectionCode='CONN', dwc:collectionID=None, dwc:continent=None, dwc:coordinatePrecision=None, dwc:coordinateUncertaintyInMeters='20000', dwc:country='USA', dwc:countryCode='US', dwc:county='Lamoille County', dwc:dataGeneralizations=None, dwc:datasetID='68712', dwc:datasetName=None, dwc:dateIdentified=None, dwc:day='24', dwc:decimalLatitude='44.54361', dwc:decimalLongitude='-72.81416', dwc:disposition=None, dwc:dynamicProperties=None, dwc:earliestAgeOrLowestStage=None, dwc:earliestEonOrLowestEonothem=None, dwc:earliestEpochOrLowestSeries=None, dwc:earliestEraOrLowestErathem=None, dwc:earliestPeriodOrLowestSystem=None, dwc:endDayOfYear=None, dwc:establishmentMeans=None, dwc:eventDate='1935-07-24', dwc:eventID=None, dwc:eventRemarks=None, dwc:eventTime=None, dwc:family='Aceraceae', dwc:fieldNotes=None, dwc:fieldNumber=None, dwc:footprintWKT=None, dwc:formation=None, dwc:genus='Acer', dwc:geodeticDatum=None, dwc:geologicalContextID=None, dwc:georeferenceProtocol=None, dwc:georeferenceRemarks=None, dwc:georeferenceSources='no date. USGS Geographic Names Information System (GNIS). U. S. Geological Survey.', dwc:georeferenceVerificationStatus=None, dwc:georeferencedBy=None, dwc:georeferencedDate=None, dwc:group=None, dwc:habitat=None, dwc:higherClassification='Plantae; Dicotyledonae; Sapindales; Aceraceae', dwc:higherGeography='USA; Vermont; Lamoille County; Cambridge', dwc:higherGeographyID=None, dwc:highestBiostratigraphicZone=None, dwc:identificationID=None, dwc:identificationQualifier=None, dwc:identificationReferences=None, dwc:identificationRemarks=None, dwc:identificationVerificationStatus=None, dwc:identifiedBy=None, dwc:individualCount=None, dwc:individualID=None, dwc:informationWithheld=None, dwc:infraspecificEpithet=None, dwc:institutionCode='UConn', dwc:institutionID=None, dwc:island=None, dwc:islandGroup=None, dwc:kingdom='Dicotyledonae', dwc:latestAgeOrHighestStage=None, dwc:latestEonOrHighestEonothem=None, dwc:latestEpochOrHighestSeries=None, dwc:latestEraOrHighestErathem=None, dwc:latestPeriodOrHighestSystem=None, dwc:lifeStage=None, dwc:lithostratigraphicTerms=None, dwc:locality='mixed woods, Hell Brook Trail, below junction of trail to Taft Lodge, Mt. Mansfield, Vt.', dwc:locationAccordingTo='seconds added from gazetteer', dwc:locationID=None, dwc:locationRemarks=None, dwc:lowestBiostratigraphicZone=None, dwc:maximumDepthInMeters=None, dwc:maximumElevationInMeters=None, dwc:member=None, dwc:minimumDepthInMeters=None, dwc:minimumElevationInMeters=None, dwc:month='7', dwc:municipality='Cambridge', dwc:nameAccordingTo=None, dwc:nameAccordingToID=None, dwc:namePublishedIn=None, dwc:namePublishedInID=None, dwc:namePublishedInYear=None, dwc:nomenclaturalCode=None, dwc:nomenclaturalStatus=None, dwc:occurrenceDetails=None, dwc:occurrenceID='urn:catalog:UConn:CONN:CONN00078687', dwc:occurrenceRemarks=None, dwc:occurrenceStatus=None, dwc:order='Sapindales', dwc:organismID=None, dwc:originalNameUsage=None, dwc:otherCatalogNumbers=None, dwc:ownerInstitutionCode=None, dwc:parentNameUsage=None, dwc:phylum=None, dwc:preparations=None, dwc:previousIdentifications='Acer pensylvanicum L.', dwc:recordNumber='2330', dwc:recordedBy='"G.S. Torrey, G. Mehlquist & A.F. Hill"', dwc:reproductiveCondition='flowering', dwc:rights=None, dwc:rightsHolder=None, dwc:samplingEffort=None, dwc:samplingProtocol=None, dwc:scientificName='Acer pensylvanicum L.', dwc:scientificNameAuthorship=None, dwc:scientificNameID=None, dwc:sex=None, dwc:specificEpithet='pensylvanicum', dwc:startDayOfYear=None, dwc:stateProvince='Vermont', dwc:subgenus=None, dwc:taxonID=None, dwc:taxonRank=None, dwc:taxonRemarks=None, dwc:taxonomicStatus=None, dwc:typeStatus=None, dwc:verbatimCoordinateSystem=None, dwc:verbatimCoordinates=None, dwc:verbatimDepth=None, dwc:verbatimElevation=None, dwc:verbatimEventDate='24-Jul-35', dwc:verbatimLatitude='44°32\' 37" N', dwc:verbatimLocality=None, dwc:verbatimLongitude='072°48\' 51" W', dwc:verbatimSRS=None, dwc:verbatimTaxonRank=None, dwc:vernacularName='Moosewood; Snake-Bark Maple; Striped Maple', dwc:waterBody=None, dwc:year='1935', fcc:datePicked=None, fcc:pickedBy=None, id=None, idigbio:preservative=None, idigbio:recordId=None, idigbio:subfamily=None, idigbio:substrate=None, idigbio:superfamily=None, symbiota:recordEnteredBy=None, symbiota:verbatimScientificName=None), datecollected=datetime.datetime(1935, 7, 23, 20, 0), datemodified=datetime.datetime(2014, 9, 12, 15, 48, 39, 510000), dqs=0.23880596458911896, earliestageorloweststage=None, earliesteonorlowesteonothem=None, earliestepochorlowestseries=None, earliesteraorlowesterathem=None, earliestperiodorlowestsystem=None, etag='0489d8f9d651285e60a30a508ad0312f63a48a6e', eventdate='1935-07-24', family='sapindaceae', fieldnumber=None, formation=None, genus='acer', geologicalcontextid=None, geopoint=Row(lat=44.54361, lon=-72.81416), group=None, hasImage=True, hasMedia=True, highertaxon='plantae; dicotyledonae; sapindales; aceraceae', highestbiostratigraphiczone=None, individualcount=None, infraspecificepithet=None, institutioncode='uconn', institutionid=None, institutionname=None, kingdom='plantae', latestageorhigheststage=None, latesteonorhighesteonothem=None, latestepochorhighestseries=None, latesteraorhighesterathem=None, latestperiodorhighestsystem=None, lithostratigraphicterms=None, locality='mixed woods, hell brook trail, below junction of trail to taft lodge, mt. mansfield, vt.', lowestbiostratigraphiczone=None, maxdepth=None, maxelevation=None, member=None, mindepth=None, minelevation=None, municipality='cambridge', occurrenceid='urn:catalog:uconn:conn:conn00078687', order='sapindales', phylum='tracheophyta', recordnumber='2330', recordset='e70af26a-fb9e-43ab-96a0-d62a2df37e6d', scientificname='acer pensylvanicum l.', specificepithet='pensylvanicum', startdayofyear=205, stateprovince='vermont', taxonid='3189836', taxonomicstatus='accepted', taxonrank='species', typestatus=None, uuid='01bc9e79-8da9-4427-aff1-43bb757b6a5c', verbatimeventdate='24-jul-35', verbatimlocality=None, version=None, waterbody=None),
 Row(barcodevalue=None, basisofrecord='preservedspecimen', bed=None, canonicalname='acer dubium', catalognumber='2014.001', class='magnoliopsida', collectioncode='vascular', collectionid=None, collectionname=None, collector='susan anderson', commonname=None, continent='north america', coordinateuncertainty=None, country='united states', countrycode='usa', county='addison', data=Row(coreid=None, dc:rights=None, dcterms:accessRights=None, dcterms:bibliographicCitation=None, dcterms:language='en', dcterms:license='https://creativecommons.org/publicdomain/zero/1.0/', dcterms:modified='2015-04-03T20:24:23-0800', dcterms:references=None, dcterms:rights=None, dcterms:rightsHolder='Idaho State University, Ray J. Davis Herbarium', dcterms:source=None, dcterms:type='PhysicalObject', dwc:VerbatimEventDate=None, dwc:acceptedNameUsage='Acer rubrum', dwc:accessRights=None, dwc:associatedMedia=None, dwc:associatedOccurrences=None, dwc:associatedReferences=None, dwc:associatedSequences=None, dwc:associatedTaxa=None, dwc:basisOfRecord='PreservedSpecimen', dwc:bed=None, dwc:behavior=None, dwc:catalogNumber='2014.001', dwc:class=None, dwc:collectionCode='Vascular', dwc:collectionID=None, dwc:continent=None, dwc:coordinatePrecision=None, dwc:coordinateUncertaintyInMeters=None, dwc:country='U.S.A.', dwc:countryCode='US', dwc:county='Addison', dwc:dataGeneralizations=None, dwc:datasetID=None, dwc:datasetName=None, dwc:dateIdentified='1978-09-01', dwc:day='1', dwc:decimalLatitude=None, dwc:decimalLongitude=None, dwc:disposition=None, dwc:dynamicProperties=None, dwc:earliestAgeOrLowestStage=None, dwc:earliestEonOrLowestEonothem=None, dwc:earliestEpochOrLowestSeries=None, dwc:earliestEraOrLowestErathem=None, dwc:earliestPeriodOrLowestSystem=None, dwc:endDayOfYear='244', dwc:establishmentMeans=None, dwc:eventDate='1978-09-01', dwc:eventID=None, dwc:eventRemarks=None, dwc:eventTime=None, dwc:family='Sapindaceae', dwc:fieldNotes=None, dwc:fieldNumber=None, dwc:footprintWKT=None, dwc:formation=None, dwc:genus='Acer', dwc:geodeticDatum=None, dwc:geologicalContextID=None, dwc:georeferenceProtocol=None, dwc:georeferenceRemarks=None, dwc:georeferenceSources=None, dwc:georeferenceVerificationStatus=None, dwc:georeferencedBy=None, dwc:georeferencedDate=None, dwc:group=None, dwc:habitat=None, dwc:higherClassification='Sapindaceae', dwc:higherGeography='U.S.A., Vermont, Addison County', dwc:higherGeographyID=None, dwc:highestBiostratigraphicZone=None, dwc:identificationID=None, dwc:identificationQualifier=None, dwc:identificationReferences=None, dwc:identificationRemarks=None, dwc:identificationVerificationStatus=None, dwc:identifiedBy='Karl E. Holte', dwc:individualCount=None, dwc:individualID=None, dwc:informationWithheld=None, dwc:infraspecificEpithet=None, dwc:institutionCode='IDS', dwc:institutionID=None, dwc:island=None, dwc:islandGroup=None, dwc:kingdom=None, dwc:latestAgeOrHighestStage=None, dwc:latestEonOrHighestEonothem=None, dwc:latestEpochOrHighestSeries=None, dwc:latestEraOrHighestErathem=None, dwc:latestPeriodOrHighestSystem=None, dwc:lifeStage=None, dwc:lithostratigraphicTerms=None, dwc:locality='Middlebury.', dwc:locationAccordingTo=None, dwc:locationID=None, dwc:locationRemarks=None, dwc:lowestBiostratigraphicZone=None, dwc:maximumDepthInMeters=None, dwc:maximumElevationInMeters=None, dwc:member=None, dwc:minimumDepthInMeters=None, dwc:minimumElevationInMeters=None, dwc:month='9', dwc:municipality=None, dwc:nameAccordingTo=None, dwc:nameAccordingToID=None, dwc:namePublishedIn=None, dwc:namePublishedInID=None, dwc:namePublishedInYear=None, dwc:nomenclaturalCode='ICBN', dwc:nomenclaturalStatus=None, dwc:occurrenceDetails=None, dwc:occurrenceID='158a5394-129b-4065-bb75-a71e0ec91a41', dwc:occurrenceRemarks=None, dwc:occurrenceStatus=None, dwc:order=None, dwc:organismID=None, dwc:originalNameUsage=None, dwc:otherCatalogNumbers='Accession: 2014.001', dwc:ownerInstitutionCode='IDS', dwc:parentNameUsage=None, dwc:phylum=None, dwc:preparations=None, dwc:previousIdentifications=None, dwc:recordNumber='s.n.', dwc:recordedBy='Susan Anderson', dwc:reproductiveCondition='vegetative', dwc:rights=None, dwc:rightsHolder=None, dwc:samplingEffort=None, dwc:samplingProtocol=None, dwc:scientificName='Acer rubrum', dwc:scientificNameAuthorship='L.', dwc:scientificNameID=None, dwc:sex=None, dwc:specificEpithet='rubrum', dwc:startDayOfYear='244', dwc:stateProvince='Vermont', dwc:subgenus=None, dwc:taxonID=None, dwc:taxonRank='species', dwc:taxonRemarks=None, dwc:taxonomicStatus=None, dwc:typeStatus=None, dwc:verbatimCoordinateSystem=None, dwc:verbatimCoordinates=None, dwc:verbatimDepth=None, dwc:verbatimElevation=None, dwc:verbatimEventDate=None, dwc:verbatimLatitude=None, dwc:verbatimLocality=None, dwc:verbatimLongitude=None, dwc:verbatimSRS=None, dwc:verbatimTaxonRank=None, dwc:vernacularName=None, dwc:waterBody=None, dwc:year='1978', fcc:datePicked=None, fcc:pickedBy=None, id='2121559', idigbio:preservative=None, idigbio:recordId='3855114A-EE7C-405F-AC3B-0A26F855B278', idigbio:subfamily=None, idigbio:substrate=None, idigbio:superfamily=None, symbiota:recordEnteredBy=None, symbiota:verbatimScientificName=None), datecollected=datetime.datetime(1978, 8, 31, 20, 0), datemodified=datetime.datetime(2016, 10, 19, 17, 14, 30, 425000), dqs=0.17910447716712952, earliestageorloweststage=None, earliesteonorlowesteonothem=None, earliestepochorlowestseries=None, earliesteraorlowesterathem=None, earliestperiodorlowestsystem=None, etag='cc05c0440b536efa9fa962899feb4220f82ebec8', eventdate='1978-09-01', family='sapindaceae', fieldnumber=None, formation=None, genus='acer', geologicalcontextid=None, geopoint=None, group=None, hasImage=True, hasMedia=True, highertaxon='sapindaceae', highestbiostratigraphiczone=None, individualcount=None, infraspecificepithet=None, institutioncode='ids', institutionid=None, institutionname=None, kingdom='plantae', latestageorhigheststage=None, latesteonorhighesteonothem=None, latestepochorhighestseries=None, latesteraorhighesterathem=None, latestperiodorhighestsystem=None, lithostratigraphicterms=None, locality='middlebury.', lowestbiostratigraphiczone=None, maxdepth=None, maxelevation=None, member=None, mindepth=None, minelevation=None, municipality=None, occurrenceid='158a5394-129b-4065-bb75-a71e0ec91a41', order='sapindales', phylum='tracheophyta', recordnumber='s.n.', recordset='dd232f5c-7f53-48ec-9bb7-7205702c3dc8', scientificname='acer rubrum', specificepithet='rubrum', startdayofyear=244, stateprovince='vermont', taxonid='4924460', taxonomicstatus='accepted', taxonrank='species', typestatus=None, uuid='aa2c47ec-ea36-4579-a5d1-e809efa872d7', verbatimeventdate=None, verbatimlocality=None, version=None, waterbody=None),
 Row(barcodevalue=None, basisofrecord='preservedspecimen', bed=None, canonicalname='acer spicatum lam.', catalognumber=None, class='magnoliopsida', collectioncode=None, collectionid='4b4dd71f-d42c-4af9-837d-0a353ad73aa9', collectionname=None, collector='b. a. connolly & d. dorfer', commonname=None, continent='north america', coordinateuncertainty=None, country='united states', countrycode='usa', county='chittenden', data=Row(coreid=None, dc:rights='http://creativecommons.org/licenses/by-nc/3.0/', dcterms:accessRights=None, dcterms:bibliographicCitation=None, dcterms:language=None, dcterms:license=None, dcterms:modified='2016-08-23 15:48:40', dcterms:references='http://sernecportal.org/portal/collections/individual/index.php?occid=6253045', dcterms:rights=None, dcterms:rightsHolder=None, dcterms:source=None, dcterms:type=None, dwc:VerbatimEventDate=None, dwc:acceptedNameUsage=None, dwc:accessRights=None, dwc:associatedMedia=None, dwc:associatedOccurrences=None, dwc:associatedReferences=None, dwc:associatedSequences=None, dwc:associatedTaxa=None, dwc:basisOfRecord='PreservedSpecimen', dwc:bed=None, dwc:behavior=None, dwc:catalogNumber=None, dwc:class=None, dwc:collectionCode=None, dwc:collectionID='4b4dd71f-d42c-4af9-837d-0a353ad73aa9', dwc:continent=None, dwc:coordinatePrecision=None, dwc:coordinateUncertaintyInMeters=None, dwc:country='USA', dwc:countryCode=None, dwc:county='Chittenden', dwc:dataGeneralizations=None, dwc:datasetID=None, dwc:datasetName=None, dwc:dateIdentified=None, dwc:day='29', dwc:decimalLatitude=None, dwc:decimalLongitude=None, dwc:disposition=None, dwc:dynamicProperties=None, dwc:earliestAgeOrLowestStage=None, dwc:earliestEonOrLowestEonothem=None, dwc:earliestEpochOrLowestSeries=None, dwc:earliestEraOrLowestErathem=None, dwc:earliestPeriodOrLowestSystem=None, dwc:endDayOfYear=None, dwc:establishmentMeans=None, dwc:eventDate='2000-08-29', dwc:eventID=None, dwc:eventRemarks=None, dwc:eventTime=None, dwc:family='Aceraceae', dwc:fieldNotes=None, dwc:fieldNumber=None, dwc:footprintWKT=None, dwc:formation=None, dwc:genus='Acer', dwc:geodeticDatum=None, dwc:geologicalContextID=None, dwc:georeferenceProtocol=None, dwc:georeferenceRemarks=None, dwc:georeferenceSources=None, dwc:georeferenceVerificationStatus=None, dwc:georeferencedBy=None, dwc:georeferencedDate=None, dwc:group=None, dwc:habitat='In wooded area.', dwc:higherClassification=None, dwc:higherGeography=None, dwc:higherGeographyID=None, dwc:highestBiostratigraphicZone=None, dwc:identificationID=None, dwc:identificationQualifier=None, dwc:identificationReferences=None, dwc:identificationRemarks=None, dwc:identificationVerificationStatus=None, dwc:identifiedBy=None, dwc:individualCount=None, dwc:individualID=None, dwc:informationWithheld=None, dwc:infraspecificEpithet=None, dwc:institutionCode='MISS', dwc:institutionID=None, dwc:island=None, dwc:islandGroup=None, dwc:kingdom='Plantae', dwc:latestAgeOrHighestStage=None, dwc:latestEonOrHighestEonothem=None, dwc:latestEpochOrHighestSeries=None, dwc:latestEraOrHighestErathem=None, dwc:latestPeriodOrHighestSystem=None, dwc:lifeStage=None, dwc:lithostratigraphicTerms=None, dwc:locality='Richmond, Owls Head. Bleuberry Farm Hillview Rd.', dwc:locationAccordingTo=None, dwc:locationID=None, dwc:locationRemarks=None, dwc:lowestBiostratigraphicZone=None, dwc:maximumDepthInMeters=None, dwc:maximumElevationInMeters=None, dwc:member=None, dwc:minimumDepthInMeters=None, dwc:minimumElevationInMeters=None, dwc:month='8', dwc:municipality=None, dwc:nameAccordingTo=None, dwc:nameAccordingToID=None, dwc:namePublishedIn=None, dwc:namePublishedInID=None, dwc:namePublishedInYear=None, dwc:nomenclaturalCode=None, dwc:nomenclaturalStatus=None, dwc:occurrenceDetails=None, dwc:occurrenceID='ef3d67d0-a5c1-4eb7-a3be-e2cc68924cb2', dwc:occurrenceRemarks='Voucher for UM NCNPR Medicinal Plant Archive CON290800-3-A, B, C, D & E.', dwc:occurrenceStatus=None, dwc:order='Sapindales', dwc:organismID=None, dwc:originalNameUsage=None, dwc:otherCatalogNumbers='63104', dwc:ownerInstitutionCode=None, dwc:parentNameUsage=None, dwc:phylum='Magnoliophyta', dwc:preparations=None, dwc:previousIdentifications=None, dwc:recordNumber='180', dwc:recordedBy='B. A. Connolly & D. Dorfer', dwc:reproductiveCondition=None, dwc:rights=None, dwc:rightsHolder=None, dwc:samplingEffort=None, dwc:samplingProtocol=None, dwc:scientificName='Acer spicatum', dwc:scientificNameAuthorship='Lam.', dwc:scientificNameID=None, dwc:sex=None, dwc:specificEpithet='spicatum', dwc:startDayOfYear='242', dwc:stateProvince='Vermont', dwc:subgenus=None, dwc:taxonID=None, dwc:taxonRank=None, dwc:taxonRemarks=None, dwc:taxonomicStatus=None, dwc:typeStatus=None, dwc:verbatimCoordinateSystem=None, dwc:verbatimCoordinates=None, dwc:verbatimDepth=None, dwc:verbatimElevation=None, dwc:verbatimEventDate='8/29/2000', dwc:verbatimLatitude=None, dwc:verbatimLocality=None, dwc:verbatimLongitude=None, dwc:verbatimSRS=None, dwc:verbatimTaxonRank=None, dwc:vernacularName=None, dwc:waterBody=None, dwc:year='2000', fcc:datePicked=None, fcc:pickedBy=None, id='6253045', idigbio:preservative=None, idigbio:recordId='urn:uuid:ef3d67d0-a5c1-4eb7-a3be-e2cc68924cb2', idigbio:subfamily=None, idigbio:substrate=None, idigbio:superfamily=None, symbiota:recordEnteredBy=None, symbiota:verbatimScientificName=None), datecollected=datetime.datetime(2000, 8, 28, 20, 0), datemodified=datetime.datetime(2016, 10, 19, 17, 41, 47, 105000), dqs=0.17910447716712952, earliestageorloweststage=None, earliesteonorlowesteonothem=None, earliestepochorlowestseries=None, earliesteraorlowesterathem=None, earliestperiodorlowestsystem=None, etag='8e56820be53f41d469d6b36569f4e6289b187cc2', eventdate='2000-08-29', family='sapindaceae', fieldnumber=None, formation=None, genus='acer', geologicalcontextid=None, geopoint=None, group=None, hasImage=False, hasMedia=False, highertaxon=None, highestbiostratigraphiczone=None, individualcount=None, infraspecificepithet=None, institutioncode='miss', institutionid=None, institutionname=None, kingdom='plantae', latestageorhigheststage=None, latesteonorhighesteonothem=None, latestepochorhighestseries=None, latesteraorhighesterathem=None, latestperiodorhighestsystem=None, lithostratigraphicterms=None, locality='richmond, owls head. bleuberry farm hillview rd.', lowestbiostratigraphiczone=None, maxdepth=None, maxelevation=None, member=None, mindepth=None, minelevation=None, municipality=None, occurrenceid='ef3d67d0-a5c1-4eb7-a3be-e2cc68924cb2', order='sapindales', phylum='tracheophyta', recordnumber='180', recordset='5e29dbcc-ce45-4f05-9bb0-212baffa8932', scientificname='acer spicatum', specificepithet='spicatum', startdayofyear=242, stateprovince='vermont', taxonid='3189848', taxonomicstatus='accepted', taxonrank='species', typestatus=None, uuid='95a2769f-ac4a-46ff-8a53-3352ba7a5f1d', verbatimeventdate='8/29/2000', verbatimlocality=None, version=None, waterbody=None),
 Row(barcodevalue=None, basisofrecord='preservedspecimen', bed=None, canonicalname='acer nigrum michx. fil.', catalognumber='yu.076177', class='magnoliopsida', collectioncode='yu', collectionid='urn:lsid:biocol.org:col:14791', collectionname=None, collector='annette harkin', commonname=None, continent='north america', coordinateuncertainty=None, country='united states', countrycode='usa', county='chittenden', data=Row(coreid=None, dc:rights='http://creativecommons.org/publicdomain/zero/1.0/', dcterms:accessRights='Open Access, http://creativecommons.org/publicdomain/zero/1.0/; see Yale Peabody policies at: http://hdl.handle.net/10079/8931zqj', dcterms:bibliographicCitation=None, dcterms:language=None, dcterms:license=None, dcterms:modified='2015-10-29 10:04:57', dcterms:references='http://portal.neherbaria.org/portal/collections/individual/index.php?occid=807895', dcterms:rights=None, dcterms:rightsHolder='Yale Peabody Museum of Natural History', dcterms:source=None, dcterms:type=None, dwc:VerbatimEventDate=None, dwc:acceptedNameUsage=None, dwc:accessRights=None, dwc:associatedMedia=None, dwc:associatedOccurrences=None, dwc:associatedReferences=None, dwc:associatedSequences=None, dwc:associatedTaxa=None, dwc:basisOfRecord='PreservedSpecimen', dwc:bed=None, dwc:behavior=None, dwc:catalogNumber='YU.076177', dwc:class='Equisetopsida', dwc:collectionCode='YU', dwc:collectionID='urn:lsid:biocol.org:col:14791', dwc:continent=None, dwc:coordinatePrecision=None, dwc:coordinateUncertaintyInMeters=None, dwc:country='United States of America', dwc:countryCode=None, dwc:county='Chittenden', dwc:dataGeneralizations=None, dwc:datasetID=None, dwc:datasetName=None, dwc:dateIdentified=None, dwc:day='23', dwc:decimalLatitude=None, dwc:decimalLongitude=None, dwc:disposition=None, dwc:dynamicProperties=None, dwc:earliestAgeOrLowestStage=None, dwc:earliestEonOrLowestEonothem=None, dwc:earliestEpochOrLowestSeries=None, dwc:earliestEraOrLowestErathem=None, dwc:earliestPeriodOrLowestSystem=None, dwc:endDayOfYear=None, dwc:establishmentMeans=None, dwc:eventDate='1971-10-23', dwc:eventID=None, dwc:eventRemarks=None, dwc:eventTime=None, dwc:family='Sapindaceae', dwc:fieldNotes=None, dwc:fieldNumber=None, dwc:footprintWKT=None, dwc:formation=None, dwc:genus='Acer', dwc:geodeticDatum=None, dwc:geologicalContextID=None, dwc:georeferenceProtocol=None, dwc:georeferenceRemarks=None, dwc:georeferenceSources=None, dwc:georeferenceVerificationStatus=None, dwc:georeferencedBy=None, dwc:georeferencedDate=None, dwc:group=None, dwc:habitat=None, dwc:higherClassification=None, dwc:higherGeography=None, dwc:higherGeographyID=None, dwc:highestBiostratigraphicZone=None, dwc:identificationID=None, dwc:identificationQualifier=None, dwc:identificationReferences=None, dwc:identificationRemarks=None, dwc:identificationVerificationStatus=None, dwc:identifiedBy=None, dwc:individualCount=None, dwc:individualID=None, dwc:informationWithheld=None, dwc:infraspecificEpithet=None, dwc:institutionCode='Yale Peabody Museum of Natural History', dwc:institutionID=None, dwc:island=None, dwc:islandGroup=None, dwc:kingdom='Plantae', dwc:latestAgeOrHighestStage=None, dwc:latestEonOrHighestEonothem=None, dwc:latestEpochOrHighestSeries=None, dwc:latestEraOrHighestErathem=None, dwc:latestPeriodOrHighestSystem=None, dwc:lifeStage=None, dwc:lithostratigraphicTerms=None, dwc:locality=None, dwc:locationAccordingTo=None, dwc:locationID=None, dwc:locationRemarks=None, dwc:lowestBiostratigraphicZone=None, dwc:maximumDepthInMeters=None, dwc:maximumElevationInMeters=None, dwc:member=None, dwc:minimumDepthInMeters=None, dwc:minimumElevationInMeters=None, dwc:month='10', dwc:municipality='Burlington', dwc:nameAccordingTo=None, dwc:nameAccordingToID=None, dwc:namePublishedIn=None, dwc:namePublishedInID=None, dwc:namePublishedInYear=None, dwc:nomenclaturalCode=None, dwc:nomenclaturalStatus=None, dwc:occurrenceDetails=None, dwc:occurrenceID='urn:uuid:71056abd-6349-4ac6-b438-5fe2a8dbc929', dwc:occurrenceRemarks=None, dwc:occurrenceStatus=None, dwc:order='Sapindales', dwc:organismID=None, dwc:originalNameUsage=None, dwc:otherCatalogNumbers=None, dwc:ownerInstitutionCode=None, dwc:parentNameUsage=None, dwc:phylum='Charophyta', dwc:preparations=None, dwc:previousIdentifications=None, dwc:recordNumber=None, dwc:recordedBy='Annette Harkin', dwc:reproductiveCondition=None, dwc:rights=None, dwc:rightsHolder=None, dwc:samplingEffort=None, dwc:samplingProtocol=None, dwc:scientificName='Acer nigrum', dwc:scientificNameAuthorship='Michx. f.', dwc:scientificNameID=None, dwc:sex=None, dwc:specificEpithet='nigrum', dwc:startDayOfYear='296', dwc:stateProvince='Vermont', dwc:subgenus=None, dwc:taxonID=None, dwc:taxonRank=None, dwc:taxonRemarks=None, dwc:taxonomicStatus=None, dwc:typeStatus=None, dwc:verbatimCoordinateSystem=None, dwc:verbatimCoordinates=None, dwc:verbatimDepth=None, dwc:verbatimElevation=None, dwc:verbatimEventDate=None, dwc:verbatimLatitude=None, dwc:verbatimLocality=None, dwc:verbatimLongitude=None, dwc:verbatimSRS=None, dwc:verbatimTaxonRank=None, dwc:vernacularName=None, dwc:waterBody=None, dwc:year='1971', fcc:datePicked=None, fcc:pickedBy=None, id='807895', idigbio:preservative=None, idigbio:recordId='urn:uuid:89e9bf3a-3482-4a70-ad9c-3bb32263fbe8', idigbio:subfamily=None, idigbio:substrate=None, idigbio:superfamily=None, symbiota:recordEnteredBy='Bob Swerling', symbiota:verbatimScientificName=None), datecollected=datetime.datetime(1971, 10, 22, 20, 0), datemodified=datetime.datetime(2016, 1, 27, 16, 25, 22, 884000), dqs=0.19402985274791718, earliestageorloweststage=None, earliesteonorlowesteonothem=None, earliestepochorlowestseries=None, earliesteraorlowesterathem=None, earliestperiodorlowestsystem=None, etag='d8b816cd3f6f237dcc01241d3eb01f1ec1f4c19b', eventdate='1971-10-23', family='sapindaceae', fieldnumber=None, formation=None, genus='acer', geologicalcontextid=None, geopoint=None, group=None, hasImage=True, hasMedia=True, highertaxon=None, highestbiostratigraphiczone=None, individualcount=None, infraspecificepithet=None, institutioncode='yale peabody museum of natural history', institutionid=None, institutionname=None, kingdom='plantae', latestageorhigheststage=None, latesteonorhighesteonothem=None, latestepochorhighestseries=None, latesteraorhighesterathem=None, latestperiodorhighestsystem=None, lithostratigraphicterms=None, locality=None, lowestbiostratigraphiczone=None, maxdepth=None, maxelevation=None, member=None, mindepth=None, minelevation=None, municipality='burlington', occurrenceid='urn:uuid:71056abd-6349-4ac6-b438-5fe2a8dbc929', order='sapindales', phylum='tracheophyta', recordnumber=None, recordset='7a8d946d-083f-4d2a-9cc9-cd590398194f', scientificname='acer nigrum', specificepithet='nigrum', startdayofyear=296, stateprovince='vermont', taxonid='3189854', taxonomicstatus='accepted', taxonrank='species', typestatus=None, uuid='ca9827b5-7369-4eb6-a6dc-984d11b75fb7', verbatimeventdate=None, verbatimlocality=None, version=None, waterbody=None),
 Row(barcodevalue=None, basisofrecord='preservedspecimen', bed=None, canonicalname='acer dubium', catalognumber='yu.076214', class='magnoliopsida', collectioncode='yu', collectionid='urn:lsid:biocol.org:col:14791', collectionname=None, collector='a. f. hill; harold st. john', commonname=None, continent='north america', coordinateuncertainty=None, country='united states', countrycode='usa', county='windham', data=Row(coreid=None, dc:rights='http://creativecommons.org/publicdomain/zero/1.0/', dcterms:accessRights='Open Access, http://creativecommons.org/publicdomain/zero/1.0/; see Yale Peabody policies at: http://hdl.handle.net/10079/8931zqj', dcterms:bibliographicCitation=None, dcterms:language=None, dcterms:license=None, dcterms:modified='2015-10-29 10:04:57', dcterms:references='http://portal.neherbaria.org/portal/collections/individual/index.php?occid=807922', dcterms:rights=None, dcterms:rightsHolder='Yale Peabody Museum of Natural History', dcterms:source=None, dcterms:type=None, dwc:VerbatimEventDate=None, dwc:acceptedNameUsage=None, dwc:accessRights=None, dwc:associatedMedia=None, dwc:associatedOccurrences=None, dwc:associatedReferences=None, dwc:associatedSequences=None, dwc:associatedTaxa=None, dwc:basisOfRecord='PreservedSpecimen', dwc:bed=None, dwc:behavior=None, dwc:catalogNumber='YU.076214', dwc:class='Equisetopsida', dwc:collectionCode='YU', dwc:collectionID='urn:lsid:biocol.org:col:14791', dwc:continent=None, dwc:coordinatePrecision=None, dwc:coordinateUncertaintyInMeters=None, dwc:country='United States of America', dwc:countryCode=None, dwc:county='Windham', dwc:dataGeneralizations=None, dwc:datasetID=None, dwc:datasetName=None, dwc:dateIdentified=None, dwc:day='15', dwc:decimalLatitude=None, dwc:decimalLongitude=None, dwc:disposition=None, dwc:dynamicProperties=None, dwc:earliestAgeOrLowestStage=None, dwc:earliestEonOrLowestEonothem=None, dwc:earliestEpochOrLowestSeries=None, dwc:earliestEraOrLowestErathem=None, dwc:earliestPeriodOrLowestSystem=None, dwc:endDayOfYear=None, dwc:establishmentMeans=None, dwc:eventDate='1915-05-15', dwc:eventID=None, dwc:eventRemarks=None, dwc:eventTime=None, dwc:family='Sapindaceae', dwc:fieldNotes=None, dwc:fieldNumber=None, dwc:footprintWKT=None, dwc:formation=None, dwc:genus='Acer', dwc:geodeticDatum=None, dwc:geologicalContextID=None, dwc:georeferenceProtocol=None, dwc:georeferenceRemarks=None, dwc:georeferenceSources=None, dwc:georeferenceVerificationStatus=None, dwc:georeferencedBy=None, dwc:georeferencedDate=None, dwc:group=None, dwc:habitat=None, dwc:higherClassification=None, dwc:higherGeography=None, dwc:higherGeographyID=None, dwc:highestBiostratigraphicZone=None, dwc:identificationID=None, dwc:identificationQualifier=None, dwc:identificationReferences=None, dwc:identificationRemarks=None, dwc:identificationVerificationStatus=None, dwc:identifiedBy=None, dwc:individualCount=None, dwc:individualID=None, dwc:informationWithheld=None, dwc:infraspecificEpithet=None, dwc:institutionCode='Yale Peabody Museum of Natural History', dwc:institutionID=None, dwc:island=None, dwc:islandGroup=None, dwc:kingdom='Plantae', dwc:latestAgeOrHighestStage=None, dwc:latestEonOrHighestEonothem=None, dwc:latestEpochOrHighestSeries=None, dwc:latestEraOrHighestErathem=None, dwc:latestPeriodOrHighestSystem=None, dwc:lifeStage=None, dwc:lithostratigraphicTerms=None, dwc:locality=None, dwc:locationAccordingTo=None, dwc:locationID=None, dwc:locationRemarks=None, dwc:lowestBiostratigraphicZone=None, dwc:maximumDepthInMeters=None, dwc:maximumElevationInMeters=None, dwc:member=None, dwc:minimumDepthInMeters=None, dwc:minimumElevationInMeters=None, dwc:month='5', dwc:municipality='Whitingham', dwc:nameAccordingTo=None, dwc:nameAccordingToID=None, dwc:namePublishedIn=None, dwc:namePublishedInID=None, dwc:namePublishedInYear=None, dwc:nomenclaturalCode=None, dwc:nomenclaturalStatus=None, dwc:occurrenceDetails=None, dwc:occurrenceID='urn:uuid:a008cd8a-ad07-485a-aeaa-ca3a2fea1e38', dwc:occurrenceRemarks=None, dwc:occurrenceStatus=None, dwc:order='Sapindales', dwc:organismID=None, dwc:originalNameUsage=None, dwc:otherCatalogNumbers=None, dwc:ownerInstitutionCode=None, dwc:parentNameUsage=None, dwc:phylum='Charophyta', dwc:preparations=None, dwc:previousIdentifications=None, dwc:recordNumber=None, dwc:recordedBy='A. F. Hill; Harold St. John', dwc:reproductiveCondition=None, dwc:rights=None, dwc:rightsHolder=None, dwc:samplingEffort=None, dwc:samplingProtocol=None, dwc:scientificName='Acer rubrum', dwc:scientificNameAuthorship='L.', dwc:scientificNameID=None, dwc:sex=None, dwc:specificEpithet='rubrum', dwc:startDayOfYear='135', dwc:stateProvince='Vermont', dwc:subgenus=None, dwc:taxonID=None, dwc:taxonRank=None, dwc:taxonRemarks=None, dwc:taxonomicStatus=None, dwc:typeStatus=None, dwc:verbatimCoordinateSystem=None, dwc:verbatimCoordinates=None, dwc:verbatimDepth=None, dwc:verbatimElevation=None, dwc:verbatimEventDate=None, dwc:verbatimLatitude=None, dwc:verbatimLocality=None, dwc:verbatimLongitude=None, dwc:verbatimSRS=None, dwc:verbatimTaxonRank=None, dwc:vernacularName=None, dwc:waterBody=None, dwc:year='1915', fcc:datePicked=None, fcc:pickedBy=None, id='807922', idigbio:preservative=None, idigbio:recordId='urn:uuid:b7aaa1a6-39d2-47a5-8854-97a0111510cb', idigbio:subfamily=None, idigbio:substrate=None, idigbio:superfamily=None, symbiota:recordEnteredBy='Bob Swerling', symbiota:verbatimScientificName=None), datecollected=datetime.datetime(1915, 5, 14, 19, 0), datemodified=datetime.datetime(2016, 1, 27, 16, 25, 22, 884000), dqs=0.19402985274791718, earliestageorloweststage=None, earliesteonorlowesteonothem=None, earliestepochorlowestseries=None, earliesteraorlowesterathem=None, earliestperiodorlowestsystem=None, etag='2d0dd08be3593c13cdf5523dafdd544e2a4bdde0', eventdate='1915-05-15', family='sapindaceae', fieldnumber=None, formation=None, genus='acer', geologicalcontextid=None, geopoint=None, group=None, hasImage=True, hasMedia=True, highertaxon=None, highestbiostratigraphiczone=None, individualcount=None, infraspecificepithet=None, institutioncode='yale peabody museum of natural history', institutionid=None, institutionname=None, kingdom='plantae', latestageorhigheststage=None, latesteonorhighesteonothem=None, latestepochorhighestseries=None, latesteraorhighesterathem=None, latestperiodorhighestsystem=None, lithostratigraphicterms=None, locality=None, lowestbiostratigraphiczone=None, maxdepth=None, maxelevation=None, member=None, mindepth=None, minelevation=None, municipality='whitingham', occurrenceid='urn:uuid:a008cd8a-ad07-485a-aeaa-ca3a2fea1e38', order='sapindales', phylum='tracheophyta', recordnumber=None, recordset='7a8d946d-083f-4d2a-9cc9-cd590398194f', scientificname='acer rubrum', specificepithet='rubrum', startdayofyear=135, stateprovince='vermont', taxonid='4924460', taxonomicstatus='accepted', taxonrank='species', typestatus=None, uuid='90d8ab18-31c3-4843-afb8-2dcd150852d2', verbatimeventdate=None, verbatimlocality=None, version=None, waterbody=None),
 Row(barcodevalue=None, basisofrecord='preservedspecimen', bed=None, canonicalname='acer saccharinum l.', catalognumber='1416621', class='magnoliopsida', collectioncode='botany', collectionid=None, collectionname=None, collector='c. g. pringle', commonname=None, continent='north america', coordinateuncertainty=None, country='united states', countrycode='usa', county=None, data=Row(coreid=None, dc:rights=None, dcterms:accessRights=None, dcterms:bibliographicCitation=None, dcterms:language=None, dcterms:license=None, dcterms:modified=None, dcterms:references=None, dcterms:rights='https://creativecommons.org/publicdomain/zero/1.0/', dcterms:rightsHolder=None, dcterms:source=None, dcterms:type='PhysicalObject', dwc:VerbatimEventDate=None, dwc:acceptedNameUsage=None, dwc:accessRights=None, dwc:associatedMedia=None, dwc:associatedOccurrences=None, dwc:associatedReferences=None, dwc:associatedSequences=None, dwc:associatedTaxa=None, dwc:basisOfRecord='PreservedSpecimen', dwc:bed=None, dwc:behavior=None, dwc:catalogNumber='1416621', dwc:class='Dicotyledonae', dwc:collectionCode='Botany', dwc:collectionID=None, dwc:continent='North America', dwc:coordinatePrecision=None, dwc:coordinateUncertaintyInMeters=None, dwc:country='United States', dwc:countryCode=None, dwc:county=None, dwc:dataGeneralizations=None, dwc:datasetID=None, dwc:datasetName=None, dwc:dateIdentified=None, dwc:day='25', dwc:decimalLatitude=None, dwc:decimalLongitude=None, dwc:disposition=None, dwc:dynamicProperties=None, dwc:earliestAgeOrLowestStage=None, dwc:earliestEonOrLowestEonothem=None, dwc:earliestEpochOrLowestSeries=None, dwc:earliestEraOrLowestErathem=None, dwc:earliestPeriodOrLowestSystem=None, dwc:endDayOfYear='151', dwc:establishmentMeans=None, dwc:eventDate=None, dwc:eventID=None, dwc:eventRemarks=None, dwc:eventTime=None, dwc:family='Aceraceae', dwc:fieldNotes=None, dwc:fieldNumber=None, dwc:footprintWKT=None, dwc:formation=None, dwc:genus='Acer', dwc:geodeticDatum=None, dwc:geologicalContextID=None, dwc:georeferenceProtocol=None, dwc:georeferenceRemarks=None, dwc:georeferenceSources=None, dwc:georeferenceVerificationStatus=None, dwc:georeferencedBy=None, dwc:georeferencedDate=None, dwc:group=None, dwc:habitat='Swamp and river banks', dwc:higherClassification='Plantae, Dicotyledonae, Sapindales, Aceraceae', dwc:higherGeography='North America, United States, Vermont', dwc:higherGeographyID=None, dwc:highestBiostratigraphicZone=None, dwc:identificationID=None, dwc:identificationQualifier=None, dwc:identificationReferences=None, dwc:identificationRemarks=None, dwc:identificationVerificationStatus=None, dwc:identifiedBy=None, dwc:individualCount='1', dwc:individualID=None, dwc:informationWithheld=None, dwc:infraspecificEpithet=None, dwc:institutionCode='US', dwc:institutionID=None, dwc:island=None, dwc:islandGroup=None, dwc:kingdom='Plantae', dwc:latestAgeOrHighestStage=None, dwc:latestEonOrHighestEonothem=None, dwc:latestEpochOrHighestSeries=None, dwc:latestEraOrHighestErathem=None, dwc:latestPeriodOrHighestSystem=None, dwc:lifeStage='Flowering and fruiting', dwc:lithostratigraphicTerms=None, dwc:locality=None, dwc:locationAccordingTo=None, dwc:locationID=None, dwc:locationRemarks=None, dwc:lowestBiostratigraphicZone=None, dwc:maximumDepthInMeters=None, dwc:maximumElevationInMeters=None, dwc:member=None, dwc:minimumDepthInMeters=None, dwc:minimumElevationInMeters=None, dwc:month='4', dwc:municipality=None, dwc:nameAccordingTo=None, dwc:nameAccordingToID=None, dwc:namePublishedIn=None, dwc:namePublishedInID=None, dwc:namePublishedInYear=None, dwc:nomenclaturalCode=None, dwc:nomenclaturalStatus=None, dwc:occurrenceDetails=None, dwc:occurrenceID='http://n2t.net/ark:/65665/30a2d51b1-cea4-4066-9795-7dece5459b37', dwc:occurrenceRemarks=None, dwc:occurrenceStatus=None, dwc:order='Sapindales', dwc:organismID=None, dwc:originalNameUsage=None, dwc:otherCatalogNumbers=None, dwc:ownerInstitutionCode=None, dwc:parentNameUsage=None, dwc:phylum=None, dwc:preparations=None, dwc:previousIdentifications=None, dwc:recordNumber='s.n.', dwc:recordedBy='C. G. Pringle', dwc:reproductiveCondition=None, dwc:rights=None, dwc:rightsHolder=None, dwc:samplingEffort=None, dwc:samplingProtocol=None, dwc:scientificName='Acer saccharinum', dwc:scientificNameAuthorship='L.', dwc:scientificNameID=None, dwc:sex=None, dwc:specificEpithet='saccharinum', dwc:startDayOfYear='116', dwc:stateProvince='Vermont', dwc:subgenus=None, dwc:taxonID=None, dwc:taxonRank=None, dwc:taxonRemarks=None, dwc:taxonomicStatus=None, dwc:typeStatus=None, dwc:verbatimCoordinateSystem=None, dwc:verbatimCoordinates=None, dwc:verbatimDepth=None, dwc:verbatimElevation=None, dwc:verbatimEventDate='25 April ----', dwc:verbatimLatitude=None, dwc:verbatimLocality=None, dwc:verbatimLongitude=None, dwc:verbatimSRS=None, dwc:verbatimTaxonRank=None, dwc:vernacularName=None, dwc:waterBody=None, dwc:year=None, fcc:datePicked=None, fcc:pickedBy=None, id='http://n2t.net/ark:/65665/30a2d51b1-cea4-4066-9795-7dece5459b37', idigbio:preservative=None, idigbio:recordId=None, idigbio:subfamily=None, idigbio:substrate=None, idigbio:superfamily=None, symbiota:recordEnteredBy=None, symbiota:verbatimScientificName=None), datecollected=None, datemodified=datetime.datetime(2016, 9, 22, 10, 42, 32, 961000), dqs=0.16417910158634186, earliestageorloweststage=None, earliesteonorlowesteonothem=None, earliestepochorlowestseries=None, earliesteraorlowesterathem=None, earliestperiodorlowestsystem=None, etag='240e603ec7c864dc590a6686bb3971cf67d9760b', eventdate=None, family='sapindaceae', fieldnumber=None, formation=None, genus='acer', geologicalcontextid=None, geopoint=None, group=None, hasImage=False, hasMedia=False, highertaxon='plantae, dicotyledonae, sapindales, aceraceae', highestbiostratigraphiczone=None, individualcount=1.0, infraspecificepithet=None, institutioncode='us', institutionid=None, institutionname=None, kingdom='plantae', latestageorhigheststage=None, latesteonorhighesteonothem=None, latestepochorhighestseries=None, latesteraorhighesterathem=None, latestperiodorhighestsystem=None, lithostratigraphicterms=None, locality=None, lowestbiostratigraphiczone=None, maxdepth=None, maxelevation=None, member=None, mindepth=None, minelevation=None, municipality=None, occurrenceid='http://n2t.net/ark:/65665/30a2d51b1-cea4-4066-9795-7dece5459b37', order='sapindales', phylum='tracheophyta', recordnumber='s.n.', recordset='a6eee223-cf3b-4079-8bb2-b77dad8cae9d', scientificname='acer saccharinum', specificepithet='saccharinum', startdayofyear=None, stateprovince='vermont', taxonid='3189837', taxonomicstatus='accepted', taxonrank='species', typestatus=None, uuid='ad666807-792f-4c2a-83fe-0740c5a48129', verbatimeventdate='25 april ----', verbatimlocality=None, version=None, waterbody=None),
 Row(barcodevalue=None, basisofrecord='preservedspecimen', bed=None, canonicalname='acer pensylvanicum l.', catalognumber='81286', class='magnoliopsida', collectioncode='upcb', collectionid=None, collectionname=None, collector='litzelman, c.', commonname=None, continent='north america', coordinateuncertainty=None, country='united states', countrycode='usa', county=None, data=Row(coreid=None, dc:rights=None, dcterms:accessRights=None, dcterms:bibliographicCitation=None, dcterms:language='pt', dcterms:license=None, dcterms:modified='2016-07-29 18:20:58-03', dcterms:references=None, dcterms:rights='Creative Commons Attribution Non Commercial (CC-BY-NC) 4.0 License.', dcterms:rightsHolder='UPCB - Herbário do Departamento de Botânica', dcterms:source=None, dcterms:type='Collection', dwc:VerbatimEventDate=None, dwc:acceptedNameUsage=None, dwc:accessRights=None, dwc:associatedMedia=None, dwc:associatedOccurrences=None, dwc:associatedReferences=None, dwc:associatedSequences=None, dwc:associatedTaxa=None, dwc:basisOfRecord='PreservedSpecimen', dwc:bed=None, dwc:behavior=None, dwc:catalogNumber='81286', dwc:class=None, dwc:collectionCode='UPCB', dwc:collectionID=None, dwc:continent=None, dwc:coordinatePrecision=None, dwc:coordinateUncertaintyInMeters=None, dwc:country='Estados Unidos', dwc:countryCode=None, dwc:county=None, dwc:dataGeneralizations=None, dwc:datasetID=None, dwc:datasetName='UPCB - Herbário do Departamento de Botânica', dwc:dateIdentified=None, dwc:day='30', dwc:decimalLatitude='44.1169999999999973', dwc:decimalLongitude='-72.6670000000000016', dwc:disposition=None, dwc:dynamicProperties=None, dwc:earliestAgeOrLowestStage=None, dwc:earliestEonOrLowestEonothem=None, dwc:earliestEpochOrLowestSeries=None, dwc:earliestEraOrLowestErathem=None, dwc:earliestPeriodOrLowestSystem=None, dwc:endDayOfYear=None, dwc:establishmentMeans=None, dwc:eventDate=None, dwc:eventID=None, dwc:eventRemarks=None, dwc:eventTime=None, dwc:family='Sapindaceae', dwc:fieldNotes=None, dwc:fieldNumber=None, dwc:footprintWKT=None, dwc:formation=None, dwc:genus='Acer', dwc:geodeticDatum=None, dwc:geologicalContextID=None, dwc:georeferenceProtocol=None, dwc:georeferenceRemarks=None, dwc:georeferenceSources=None, dwc:georeferenceVerificationStatus=None, dwc:georeferencedBy=None, dwc:georeferencedDate=None, dwc:group=None, dwc:habitat=None, dwc:higherClassification=None, dwc:higherGeography=None, dwc:higherGeographyID=None, dwc:highestBiostratigraphicZone=None, dwc:identificationID=None, dwc:identificationQualifier=None, dwc:identificationReferences=None, dwc:identificationRemarks=None, dwc:identificationVerificationStatus=None, dwc:identifiedBy=None, dwc:individualCount=None, dwc:individualID=None, dwc:informationWithheld=None, dwc:infraspecificEpithet=None, dwc:institutionCode='UFPR', dwc:institutionID=None, dwc:island=None, dwc:islandGroup=None, dwc:kingdom='Plantae', dwc:latestAgeOrHighestStage=None, dwc:latestEonOrHighestEonothem=None, dwc:latestEpochOrHighestSeries=None, dwc:latestEraOrHighestErathem=None, dwc:latestPeriodOrHighestSystem=None, dwc:lifeStage=None, dwc:lithostratigraphicTerms=None, dwc:locality='Garvey Hill: Northfield, VT', dwc:locationAccordingTo=None, dwc:locationID=None, dwc:locationRemarks=None, dwc:lowestBiostratigraphicZone=None, dwc:maximumDepthInMeters=None, dwc:maximumElevationInMeters=None, dwc:member=None, dwc:minimumDepthInMeters=None, dwc:minimumElevationInMeters=None, dwc:month='11', dwc:municipality=None, dwc:nameAccordingTo=None, dwc:nameAccordingToID=None, dwc:namePublishedIn=None, dwc:namePublishedInID=None, dwc:namePublishedInYear=None, dwc:nomenclaturalCode=None, dwc:nomenclaturalStatus=None, dwc:occurrenceDetails=None, dwc:occurrenceID='BRA:UFPR:UPCB:0000081286', dwc:occurrenceRemarks='Found in woods.', dwc:occurrenceStatus=None, dwc:order=None, dwc:organismID=None, dwc:originalNameUsage=None, dwc:otherCatalogNumbers=None, dwc:ownerInstitutionCode='Universidade Federal do Paraná, UFPR', dwc:parentNameUsage=None, dwc:phylum=None, dwc:preparations=None, dwc:previousIdentifications=None, dwc:recordNumber='53', dwc:recordedBy='Litzelman, C.', dwc:reproductiveCondition=None, dwc:rights=None, dwc:rightsHolder=None, dwc:samplingEffort=None, dwc:samplingProtocol=None, dwc:scientificName='Acer pensylvanicum', dwc:scientificNameAuthorship='L.', dwc:scientificNameID=None, dwc:sex=None, dwc:specificEpithet='pensylvanicum', dwc:startDayOfYear=None, dwc:stateProvince='Vermont', dwc:subgenus=None, dwc:taxonID=None, dwc:taxonRank=None, dwc:taxonRemarks=None, dwc:taxonomicStatus=None, dwc:typeStatus=None, dwc:verbatimCoordinateSystem=None, dwc:verbatimCoordinates=None, dwc:verbatimDepth=None, dwc:verbatimElevation=None, dwc:verbatimEventDate=None, dwc:verbatimLatitude='44.117', dwc:verbatimLocality=None, dwc:verbatimLongitude='-72.667', dwc:verbatimSRS=None, dwc:verbatimTaxonRank=None, dwc:vernacularName=None, dwc:waterBody=None, dwc:year='1992', fcc:datePicked=None, fcc:pickedBy=None, id='BRA:UFPR:UPCB:0000081286', idigbio:preservative=None, idigbio:recordId=None, idigbio:subfamily=None, idigbio:substrate=None, idigbio:superfamily=None, symbiota:recordEnteredBy=None, symbiota:verbatimScientificName=None), datecollected=datetime.datetime(1992, 11, 30, 0, 0), datemodified=datetime.datetime(2016, 8, 31, 9, 29, 25, 708000), dqs=0.1492537260055542, earliestageorloweststage=None, earliesteonorlowesteonothem=None, earliestepochorlowestseries=None, earliesteraorlowesterathem=None, earliestperiodorlowestsystem=None, etag='919b6debd9dab02219fce8feb1ef613833a8e0be', eventdate=None, family='sapindaceae', fieldnumber=None, formation=None, genus='acer', geologicalcontextid=None, geopoint=Row(lat=44.117, lon=-72.667), group=None, hasImage=False, hasMedia=False, highertaxon=None, highestbiostratigraphiczone=None, individualcount=None, infraspecificepithet=None, institutioncode='ufpr', institutionid=None, institutionname=None, kingdom='plantae', latestageorhigheststage=None, latesteonorhighesteonothem=None, latestepochorhighestseries=None, latesteraorhighesterathem=None, latestperiodorhighestsystem=None, lithostratigraphicterms=None, locality='garvey hill: northfield, vt', lowestbiostratigraphiczone=None, maxdepth=None, maxelevation=None, member=None, mindepth=None, minelevation=None, municipality=None, occurrenceid='bra:ufpr:upcb:0000081286', order='sapindales', phylum='tracheophyta', recordnumber='53', recordset='7311c4ac-7cf6-4160-a55c-4a4c7cd0cf89', scientificname='acer pensylvanicum', specificepithet='pensylvanicum', startdayofyear=335, stateprovince='vermont', taxonid='3189836', taxonomicstatus='accepted', taxonrank='species', typestatus=None, uuid='a4cc5fed-d924-4d1b-94fe-65271064593b', verbatimeventdate=None, verbatimlocality=None, version=None, waterbody=None)]

In [23]:
df.count()


Out[23]:
447

In [24]:
df.select(df["uuid"]).head(10)


Out[24]:
[Row(uuid='2309622d-a818-4456-b51b-b8bd79587baa'),
 Row(uuid='ef76c868-e5f8-4788-9c31-32947bfdc122'),
 Row(uuid='8536ba01-e79a-4430-b262-3a91305e2df2'),
 Row(uuid='4f8e4b95-5c23-4378-8702-56816b281c51'),
 Row(uuid='3ca004b6-67cc-4fa1-b1b6-40a5e1608b15'),
 Row(uuid='d3ab9e5a-d143-41eb-be2d-780b8b04ea8e'),
 Row(uuid='b7a42fe6-4e67-40ec-9f96-7496e1a59f38'),
 Row(uuid='640f59a8-c1ae-4cbf-9fd7-0b3e9bc3db7d'),
 Row(uuid='adbf7eb7-dc64-4bdc-aa84-7f90e5928b84'),
 Row(uuid='32aa482d-0af5-4ea7-93ae-3035e9c18b35')]

In [25]:
(df.write
.mode("overwrite")
.parquet("/outputs/scrap")
)

In [ ]: