-
Notifications
You must be signed in to change notification settings - Fork 0
/
settings.py
executable file
·40 lines (31 loc) · 1021 Bytes
/
settings.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
__author__ = '@jotegui'
# Import modules in lib folder
import os
import sys

# Make the "lib" folder that sits next to this file importable.
# The location is resolved to an absolute path first: __file__ can be relative
# (for instance when the file is run as a script), and a relative sys.path
# entry would stop resolving if the working directory changes later on.
sys.path.insert(0, os.path.join(os.path.dirname(os.path.abspath(__file__)), 'lib'))
# Example configuration: GBIF processing
# Which data source is being processed; accepted values are "ebird" and "gbif"
source = 'gbif'
# Main data table in RedShift
redshift_table = 'gbif_jun_15'
# Slim list of fields, each given as a [name, type] pair.
# The rows are written as tuples for readability and converted back so that
# `fields` remains a list of two-item lists.
fields = list(map(list, (
    ('gbifid', 'bigint'),
    ('decimallatitude', 'double precision'),
    ('decimallongitude', 'double precision'),
    ('coordinateaccuracy', 'varchar(256)'),
    ('species', 'varchar(256)'),
    ('eventdate', 'varchar(20)'),
    ('year', 'integer'),
    ('datasetkey', 'varchar(256)'),
    ('basisofrecord', 'varchar(256)'),
)))
# Local folder where the slim slices are stored
slices_folder = 'slim'
# Redshift field holding the scientific name
sciname_field = 'species'
# Coordinate fields: latitude first, then longitude
latitude_field, longitude_field = 'decimallatitude', 'decimallongitude'
# Upper bound on the number of rows in each partition table (ten million)
threshold = 10 ** 7