renamed script to excel processor
This commit is contained in:
1
excelProccessor/import/__init__.py
Normal file
1
excelProccessor/import/__init__.py
Normal file
@ -0,0 +1 @@
|
||||
__version__ = '0.1.0'
|
83
excelProccessor/import/main.py
Normal file
83
excelProccessor/import/main.py
Normal file
@ -0,0 +1,83 @@
|
||||
import typer
|
||||
import pymongo
|
||||
import pandas as pd
|
||||
import numpy as np
|
||||
import math
|
||||
|
||||
MONGO_URL = "mongodb://localhost:27017/"
|
||||
MONGO_DB = "dev"
|
||||
|
||||
def upload_to_mongo(resources, ar_col):
|
||||
ar_col.insert_many(resources)
|
||||
|
||||
def get_entry(row, col, default_val=np.nan):
|
||||
'''
|
||||
Parameters
|
||||
----------
|
||||
default_val : any
|
||||
If NaN is returned for entry, default to this.
|
||||
'''
|
||||
if row.loc[col]['entry'] is np.nan:
|
||||
return default_val
|
||||
return row.loc[col]['entry']
|
||||
|
||||
def get_manufacturer(row, col):
|
||||
'''
|
||||
Get entry column for a manufacturer.
|
||||
'''
|
||||
if row.loc[col]['entry'] is np.nan:
|
||||
return None
|
||||
|
||||
required = row.loc[col]['required']
|
||||
return {
|
||||
"name": row.loc[col]['entry'],
|
||||
"required": isinstance(required, str)
|
||||
}
|
||||
|
||||
def get_selected_options(row, col):
|
||||
return row.loc[col].dropna(inplace=False).index.to_list()
|
||||
|
||||
def get_range(row, col):
|
||||
return {
|
||||
"min": int(row.loc[col]['min']),
|
||||
"max": int(row.loc[col]['max'])
|
||||
}
|
||||
|
||||
def get_platform_links(row):
|
||||
platforms = row['Platforms:'].dropna(inplace=False)
|
||||
return [{"link": platforms[key], "platform": key} for key in platforms.index]
|
||||
|
||||
def main(path: str):
|
||||
df = pd.read_excel(path, header=[0,1])
|
||||
|
||||
mongo_client = pymongo.MongoClient(MONGO_URL)
|
||||
mongo_db = mongo_client[MONGO_DB]
|
||||
ar_col = mongo_db["AuditoryResource"]
|
||||
|
||||
resources = []
|
||||
|
||||
for i in range(0,len(df.index)):
|
||||
resource = {}
|
||||
|
||||
resource["name"] = get_entry(df.iloc[i], 'Resource:', "n/a")
|
||||
resource["icon"] = get_entry(df.iloc[i], 'Icon:', "")
|
||||
resource["description"] = get_entry(df.iloc[i], 'Description:', "n/a")
|
||||
resource["manufacturer"] = get_manufacturer(df.iloc[i], 'Manufacturer:')
|
||||
resource["platform_links"] = get_platform_links(df.iloc[i])
|
||||
resource["ages"] = get_range(df.iloc[i], 'Age Group:')
|
||||
resource["skills"] = get_selected_options(df.iloc[i], 'Skills:')
|
||||
resource["skill_levels"] = get_selected_options(df.iloc[i], 'Skill Level:')
|
||||
resource["payment_options"] = get_selected_options(df.iloc[i], 'Cost:')
|
||||
|
||||
print(f"Finished parsing resource on line {i+2}:")
|
||||
print(resource)
|
||||
print("--------------------------------\n")
|
||||
|
||||
resources.append(resource)
|
||||
|
||||
print("Uploading to MongoDB...")
|
||||
upload_to_mongo(resources, ar_col)
|
||||
print("Upload success!")
|
||||
|
||||
if __name__ == "__main__":
|
||||
typer.run(main)
|
Reference in New Issue
Block a user