By Michael Erb (michael.erb@nau.edu), October 28, 2022
Proxy records (e.g., ice cores, sediment cores, and speleothems) provide the main source of climate information used in paleoclimate data assimilation. Recent efforts have compiled proxy data into large machine-readable databases.
In this notebook, we'll load and plot proxy data from the Temperature 12k database v. 1.0.2, which can be visualized here: https://lipdverse.org/Temp12k/1_0_2/. The data can be downloaded on the left side of that page.
This notebook was made in Google Colab. The first cell below sets up Google Colab. If you're using this code in a different environment, you can probably skip this first code cell.
# Install lipd and cartopy
!pip install lipd
!pip install cartopy==0.19.0.post1
# In Google Colab, cartopy and shapely don't get along well. The line below reinstalls shapely so that cartopy works correctly; it's only necessary in Google Colab.
!pip install --no-binary shapely shapely --force
import warnings
from shapely.errors import ShapelyDeprecationWarning
warnings.filterwarnings('ignore',category=ShapelyDeprecationWarning)
# Mount Google Drive locally
from google.colab import drive
drive.mount('/content/drive')
Python libraries provide additional functionality. Here, we import some that will be used later.
import numpy as np
import matplotlib.pyplot as plt
import cartopy.crs as ccrs
import cartopy.feature as cfeature
import pickle
import lipd
plt.style.use('ggplot') # This sets the plotting style for the figures we'll be making later.
Now, let's load the Temp12k database v1.0.2 (https://lipdverse.org/Temp12k/1_0_2/). In Python, we can load either the LiPD files or a pickle file. The two code cells below demonstrate both options; you only need to run one or the other, depending on which data format you downloaded. The pickle file is significantly faster to load.
If you download the LiPD files, unzip the folder. You can load all of the files in the folder or specify a single file instead (both are shown below).
# Load the Temp12k proxy data from the pickle file
data_dir = '/content/drive/MyDrive/using_lipd_files/lipd_data/' # Update this line to where your data is stored.
with open(data_dir+'Temp12k1_0_2.pkl','rb') as file_to_open:
    proxies_all = pickle.load(file_to_open)['D']
# Alternatively, load the Temp12k proxy data from the LiPD files
data_dir = '/content/drive/MyDrive/using_lipd_files/lipd_data/Temp12k1_0_2/' # Update this line to where your data is stored.
proxies_all = lipd.readLipd(data_dir)
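To load a single LiPD file instead of the whole folder, point lipd.readLipd at one .lpd file. A minimal sketch, where the filename is a hypothetical placeholder; substitute one from your downloaded folder.
# Load a single LiPD file (this filename is a hypothetical placeholder)
proxies_single = lipd.readLipd(data_dir+'ExampleDataset.Author.2020.lpd')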
The commands below extract the individual time series from the database, then filter them so that we keep only the records that are part of the Temp12k compilation and have units of degC:
# Extract the time series and use only those which are in Temp12k and in units of degC
all_ts = lipd.extractTs(proxies_all)
proxy_ts = lipd.filterTs(all_ts, 'paleoData_inCompilation == Temp12k')
proxy_ts = lipd.filterTs(proxy_ts,'paleoData_units == degC')
n_proxies = len(proxy_ts)
The proxy database is now stored as a list called "proxy_ts", which is 1276 entries long. Each entry in the list is a dictionary. You can see for yourself:
print(type(proxy_ts),len(proxy_ts))
print(type(proxy_ts[0]))
Python is a 0-indexed language, so to print the first proxy record, we would use the command:
print(proxy_ts[0])
As you can see, there's a lot of data and metadata. Since "proxy_ts[0]" is a dictionary, we need to use the right key to get a specific piece of data or metadata from it. To see all of the keys, you could use the command:
print(proxy_ts[0].keys())
Some of the more important keys are:
Key | Explanation |
---|---|
paleoData_values | The proxy record data |
age | The proxy record ages |
dataSetName | Data set name |
paleoData_TSid | The "TSid," which is a unique identifier for the proxy record |
archiveType | Archive type |
paleoData_proxyGeneral | General proxy type |
paleoData_proxy | Specific proxy type |
paleoData_variableName | Variable |
geo_meanLat | Latitude (-90 to 90) |
geo_meanLon | Longitude (-180 to 180) |
geo_meanElev | Elevation (m) |
paleoData_interpretation | Notes about the interpretation of the proxy record |
originalDataUrl | The URL of the original proxy record |
paleoData_units | Units of the data |
ageUnits | Units of the ages |
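Note that some of this metadata is nested. In particular, paleoData_interpretation is a list of dictionaries, so reaching a field inside it takes an extra index and key. A minimal sketch (using .get() with defaults, since not every record includes every field):
# paleoData_interpretation is a list of dictionaries; index into it to reach nested fields
interpretation = proxy_ts[0].get('paleoData_interpretation',[{}])
print(interpretation[0].get('seasonalityGeneral','not given'))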
To demonstrate how keys are used, the code below gets some data and metadata from the proxy record, then makes a simple figure.
# Get data
index_chosen = 0
proxy_data = np.array(proxy_ts[index_chosen]['paleoData_values']).astype(float)
proxy_ages = np.array(proxy_ts[index_chosen]['age']).astype(float)
dataset_name = proxy_ts[index_chosen]['dataSetName']
# Make a simple figure
plt.plot(proxy_ages,proxy_data)
plt.xlabel('Age ('+proxy_ts[index_chosen]['ageUnits']+')')
plt.ylabel('T ('+proxy_ts[index_chosen]['paleoData_units']+')')
plt.title(dataset_name)
plt.show()
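Besides selecting a record by its position in the list, you can use lipd.filterTs (the same function we used to filter the database above) to find records matching a metadata field. A minimal sketch, where the TSid is a hypothetical placeholder; print paleoData_TSid values to find real identifiers.
# Select records by TSid. 'RabcDEF123' is a hypothetical placeholder.
selected_ts = lipd.filterTs(proxy_ts,'paleoData_TSid == RabcDEF123')
print(len(selected_ts))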
To get a better sense of what's in the database, let's make a function to summarize a chosen metadata key across all 1276 records.
Note: Defining functions is useful when you want to run the same code multiple times in different contexts.
# Print a sorted list of a selected variable
def print_sorted_list(key):
    #
    # Make a list of all values of the given key
    variable_all = []
    for i in range(n_proxies):
        try: variable_all.append(proxy_ts[i][key])
        except KeyError: variable_all.append('not given')
    #
    # Count the occurrences of each value
    name_words,name_counts = np.unique(variable_all,return_counts=True)
    count_sort_ind = np.argsort(-name_counts)
    name_words_sorted = name_words[count_sort_ind]
    name_counts_sorted = name_counts[count_sort_ind]
    #
    # Print the counts, most common first
    print('===',key,'===')
    for i in range(len(name_counts_sorted)):
        print('%25s %5s' % (name_words_sorted[i],name_counts_sorted[i]))
Run the code below to display the counts for the archive types across all of the records.
print_sorted_list('archiveType')
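The same function works for any of the keys in the table above. For example, to see the proxy types and variables in the database:
# Summarize some other metadata fields
print_sorted_list('paleoData_proxy')
print_sorted_list('paleoData_variableName')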
Okay, let's make some more figures. First, let's make a map of all proxy locations. To do this, we need the lats and lons of all of the proxy records.
# Create empty arrays to store the lats and lons
lats_all = np.zeros((n_proxies)); lats_all[:] = np.nan
lons_all = np.zeros((n_proxies)); lons_all[:] = np.nan
# Loop through all proxy records, storing the lats and lons in the newly-created arrays
for i in range(n_proxies):
    lats_all[i] = proxy_ts[i]['geo_meanLat']
    lons_all[i] = proxy_ts[i]['geo_meanLon']
Now, let's create two functions: one to map the proxy locations in a given region, and one to print metadata for the proxies in that region.
# A function to make a map of all proxy locations in a given region
def proxy_map(map_bounds):
    #
    # Count the number of proxy records in this region
    n_selected = len(np.where((lons_all >= map_bounds[0]) & (lons_all <= map_bounds[1]) & (lats_all >= map_bounds[2]) & (lats_all <= map_bounds[3]))[0])
    #
    # Plot the locations of all proxy records in the region
    plt.figure(figsize=(12,20))
    ax1 = plt.subplot2grid((1,1),(0,0),projection=ccrs.PlateCarree()); ax1.set_extent(map_bounds,crs=ccrs.PlateCarree())
    ax1.scatter(lons_all,lats_all,25,c='r',marker='o',alpha=1,transform=ccrs.PlateCarree())
    ax1.coastlines()
    ax1.gridlines(color='k',linestyle='--',draw_labels=True)
    ax1.set_title('Locations of '+str(n_selected)+' proxy records',fontsize=14,loc='center')
    plt.show()
# A function to print selected metadata of all proxies in a given region.
def proxy_metadata(region_bounds):
    #
    # Find the proxy records in the region
    ind_selected = np.where((lons_all >= region_bounds[0]) & (lons_all <= region_bounds[1]) & (lats_all >= region_bounds[2]) & (lats_all <= region_bounds[3]))[0]
    print('Records found in the region',region_bounds,':',len(ind_selected))
    #
    # Print some metadata for the selected proxies
    print_fmt = '%5s %30s %16s %12s %12s %10s %10s %12s %-10s'
    print(print_fmt % ('Index','dataSetName','Archive','Proxy','Variable','Lat','Lon','Season','Original_URL'))
    print(print_fmt % ('=====','===========','=======','=====','========','===','===','======','============'))
    for i in ind_selected:
        print(print_fmt % (i,
                           proxy_ts[i]['dataSetName'],
                           proxy_ts[i]['archiveType'],
                           proxy_ts[i]['paleoData_proxy'],
                           proxy_ts[i]['paleoData_variableName'],
                           proxy_ts[i]['geo_meanLat'],
                           proxy_ts[i]['geo_meanLon'],
                           proxy_ts[i]['paleoData_interpretation'][0]['seasonalityGeneral'],
                           proxy_ts[i]['originalDataUrl']))
Both of the functions above take an input list with four values: [lon_min, lon_max, lat_min, lat_max]. Let's try it:
# Make a global map
proxy_map([-180,180,-90,90])
Now, let's use both functions to make a map and list the proxies in a particular region. In the code below, I've selected a part of southern Asia.
# Map and list the proxies in a given region
region_selected = [60,120,0,30] # Give values in the format [lon_min, lon_max, lat_min, lat_max]
proxy_map(region_selected)
proxy_metadata(region_selected)
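Feel free to change region_selected to explore other parts of the world. For example, here are bounds roughly covering Europe (chosen just for illustration):
# Another example region, roughly covering Europe
region_selected = [-15,45,35,75] # Give values in the format [lon_min, lon_max, lat_min, lat_max]
proxy_map(region_selected)
proxy_metadata(region_selected)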
Hopefully this has helped you get started using LiPD files in Python!