Code development platform for open source projects from the European Union institutions

Skip to content
Snippets Groups Projects
main.py 777 B
Newer Older
Thomas Vliagkoftis's avatar
Thomas Vliagkoftis committed
#!/usr/bin/env python

from uds4jrc.config import Config
from uds4jrc.db import eea_raw_data
Thomas Vliagkoftis's avatar
Thomas Vliagkoftis committed
from munch import Munch
from collections import defaultdict

import pandas as pd

Thomas Vliagkoftis's avatar
Thomas Vliagkoftis committed
# Settings for the 2019 EEA file, wrapped in a Munch so the keys can be read
# as attributes (file_config.delimiter, file_config.encoding, ...).
file_config = Munch(Config.EEA_2019)

# column_properties is indexed positionally: column 0 supplies the column
# names, columns 1-2 supply the (key, dtype) pairs for the dtype mapping.
# NOTE(review): presumably a pandas DataFrame -- confirm against Config.
column_properties = file_config.column_properties

# Per-column dtypes; any column without an explicit entry is read as object.
# NOTE(review): the dtype keys come from column 1 while `names` below comes
# from column 0. If those two columns hold different labels, the explicit
# dtypes never match and every column silently falls back to object -- verify.
column_dtypes = defaultdict(
    lambda: object,
    column_properties.iloc[:, 1:3].values,
)

# Because chunksize is set, read_csv returns an iterator of DataFrames
# (up to 100000 rows each) instead of loading the whole file at once.
chunks = pd.read_csv(
    '/eos/jeodpp/data/projects/LEGENT/transfer/EEA_passenger_cars_2019_final_AMI.csv',
    delimiter=file_config.delimiter,
    # header=0 together with `names` replaces the file's own header row
    # with the configured column names.
    header=0,
    dtype=column_dtypes,
    names=column_properties.iloc[:, 0].values,
    chunksize=100000,
    encoding=file_config.encoding,
    index_col=False,
    low_memory=False,
)

# Process the CSV one chunk at a time and store each chunk's rows.
for df in chunks:
    # Remove the 'id' column from the chunk before it is stored.
    df.drop(columns=['id'], inplace=True)

    # Tag every row with the configured year and a fixed version value.
    df['file_year'] = file_config.year
    df['version'] = 1.0

    # One dict per row, inserted in a single batch call.
    # NOTE(review): eea_raw_data is presumably a MongoDB collection -- confirm
    # in uds4jrc.db.
    records = df.to_dict(orient='records')
    eea_raw_data.insert_many(records)