igdb/code/database/parse_csv.py

from pandas import read_csv, concat, DataFrame
from iso3166 import countries as co


def country_conversion(political_unit) -> str:
    """Return the ISO 3166 country name for ``political_unit``.

    The value is passed unchanged to ``iso3166.countries.get`` and the
    ``name`` attribute of the record it returns is handed back.
    """
    return co.get(political_unit).name


def select_columns() -> DataFrame:
    """Load the WGMS change table, keeping selected columns and recent years.

    Reads ``../../data/WGMS-FoG-2019-12-D-CHANGE.csv`` (resolved against the
    current working directory) in chunks of 100 rows, restricted to the
    columns listed in ``fields``. ``POLITICAL_UNIT`` values are mapped through
    ``country_conversion``; only rows whose ``YEAR`` is strictly greater than
    ``min_year`` (2010) are kept.

    Returns:
        DataFrame: the filtered rows of every chunk, concatenated.
    """
    min_year = 2010
    fields = [
        "POLITICAL_UNIT",
        "WGMS_ID",
        "YEAR",
        "AREA_SURVEY_YEAR",
        "AREA_CHANGE",
        # NOTE(review): the only field name written with a space instead of
        # an underscore -- confirm it matches the CSV header exactly.
        "THICKNESS CHANGE",
        "VOLUME_CHANGE",
    ]
    iter_csv = read_csv(
        "../../data/WGMS-FoG-2019-12-D-CHANGE.csv",
        skipinitialspace=True,
        usecols=fields,
        iterator=True,
        chunksize=100,
        # Convert the country column, not YEAR: YEAR has to stay numeric for
        # the comparison against min_year below.
        converters={"POLITICAL_UNIT": country_conversion},
    )
    # Filter chunk by chunk so rows outside the year range are dropped
    # before the pieces are joined.
    data = concat([chunk[chunk["YEAR"] > min_year] for chunk in iter_csv])
    return data
Rename code folder and add filters to parser 2020-01-05 01:00:06 +01:00			`from pandas import read_csv, concat, DataFrame`
Create constants file and move tables to db_setup 2020-01-05 02:51:14 +01:00			`from iso3166 import countries as co`
Rename code folder and add filters to parser 2020-01-05 01:00:06 +01:00

Create constants file and move tables to db_setup 2020-01-05 02:51:14 +01:00			`def country_conversion(political_unit) -> str:`
			`codes = co.get(political_unit)`
			`return codes.name`


			`def select_columns() -> DataFrame:`
Rename code folder and add filters to parser 2020-01-05 01:00:06 +01:00			`min_year = 2010`
Create constants file and move tables to db_setup 2020-01-05 02:51:14 +01:00			`fields = [`
			`"POLITICAL_UNIT",`
			`"WGMS_ID",`
			`"YEAR",`
			`"AREA_SURVEY_YEAR",`
			`"AREA_CHANGE",`
			`"THICKNESS CHANGE",`
			`"VOLUME_CHANGE",`
			`]`
Rename code folder and add filters to parser 2020-01-05 01:00:06 +01:00			`iter_csv = read_csv(`
Create constants file and move tables to db_setup 2020-01-05 02:51:14 +01:00			`"../../data/WGMS-FoG-2019-12-D-CHANGE.csv",`
Rename code folder and add filters to parser 2020-01-05 01:00:06 +01:00			`skipinitialspace=True,`
			`usecols=fields,`
			`iterator=True,`
			`chunksize=100,`
Create constants file and move tables to db_setup 2020-01-05 02:51:14 +01:00			`converters={"YEAR": country_conversion},`
Rename code folder and add filters to parser 2020-01-05 01:00:06 +01:00			`)`
			`data = concat([chunk[chunk["YEAR"] > min_year] for chunk in iter_csv])`
			`return data`