2023-04-19 08:57:03 -05:00

84 lines
2.4 KiB
Python

import typer
import pymongo
import pandas as pd
import numpy as np
import math
MONGO_URL = "mongodb://localhost:27017/"
MONGO_DB = "dev"
def upload_to_mongo(resources, ar_col):
ar_col.insert_many(resources)
def get_entry(row, col, default_val=np.nan):
'''
Parameters
----------
default_val : any
If NaN is returned for entry, default to this.
'''
if row.loc[col]['entry'] is np.nan:
return default_val
return row.loc[col]['entry']
def get_manufacturer(row, col):
'''
Get entry column for a manufacturer.
'''
if row.loc[col]['entry'] is np.nan:
return None
required = row.loc[col]['required']
return {
"name": row.loc[col]['entry'],
"required": isinstance(required, str)
}
def get_selected_options(row, col):
return row.loc[col].dropna(inplace=False).index.to_list()
def get_range(row, col):
return {
"min": int(row.loc[col]['min']),
"max": int(row.loc[col]['max'])
}
def get_platform_links(row):
platforms = row['Platforms:'].dropna(inplace=False)
return [{"link": platforms[key], "platform": key} for key in platforms.index]
def main(path: str):
df = pd.read_excel(path, header=[0,1])
mongo_client = pymongo.MongoClient(MONGO_URL)
mongo_db = mongo_client[MONGO_DB]
ar_col = mongo_db["AuditoryResource"]
resources = []
for i in range(0,len(df.index)):
resource = {}
resource["name"] = get_entry(df.iloc[i], 'Resource:', "n/a")
resource["icon"] = get_entry(df.iloc[i], 'Icon:', "")
resource["description"] = get_entry(df.iloc[i], 'Description:', "n/a")
resource["manufacturer"] = get_manufacturer(df.iloc[i], 'Manufacturer:')
resource["platform_links"] = get_platform_links(df.iloc[i])
resource["ages"] = get_range(df.iloc[i], 'Age Group:')
resource["skills"] = get_selected_options(df.iloc[i], 'Skills:')
resource["skill_levels"] = get_selected_options(df.iloc[i], 'Skill Level:')
resource["payment_options"] = get_selected_options(df.iloc[i], 'Cost:')
print(f"Finished parsing resource on line {i+2}:")
print(resource)
print("--------------------------------\n")
resources.append(resource)
print("Uploading to MongoDB...")
upload_to_mongo(resources, ar_col)
print("Upload success!")
if __name__ == "__main__":
typer.run(main)