diff options
-rwxr-xr-x | regenTheExpertTA.py | 74 | ||||
-rwxr-xr-x | regenWebAssign.py | 63 | ||||
-rwxr-xr-x | toBlackboardCSV.py | 12 |
3 files changed, 86 insertions, 63 deletions
diff --git a/regenTheExpertTA.py b/regenTheExpertTA.py index d0277bc..34c7f8e 100755 --- a/regenTheExpertTA.py +++ b/regenTheExpertTA.py @@ -9,25 +9,25 @@ import os infile = sys.argv[1] f = open(infile) -l= f.readlines() -h= l[0] -hsub=l[1] # TheExpertTA keep headers in 2 lines (mixed with max possible points) -maxPossible=l[1] +l = f.readlines() +h = l[0] +hsub = l[1] # TheExpertTA keep headers in 2 lines (mixed with max possible points) +maxPossible = l[1] f.close() # clean up of headers -h=h.strip() -h = h.replace('"', '') +h = h.strip() +h = h.replace('"', "") hsub = hsub.strip() -hsub = hsub.replace('"', '') -hsub = hsub.split(',') -headers = h.split(',') +hsub = hsub.replace('"', "") +hsub = hsub.split(",") +headers = h.split(",") # we should fail hard if this column names are not present -headers[hsub.index('Last')]='LastName' -headers[hsub.index('First')]='FirstName' -headers[hsub.index('Email')]='UserName' -headers[hsub.index('Student No')]='SID' +headers[hsub.index("Last")] = "LastName" +headers[hsub.index("First")] = "FirstName" +headers[hsub.index("Email")] = "UserName" +headers[hsub.index("Student No")] = "SID" # headers[0]='FullName' # headers[1]='UserName' @@ -38,16 +38,19 @@ headers[hsub.index('Student No')]='SID' d = pd.read_csv(infile, skiprows=[0], header=None, names=headers) # First row contains max points information, so let's reassign it -d.loc[0, 'UserName']='_Max_Points_' -d.loc[0, 'LastName']='MaxScore' -d.loc[0, 'FirstName']='MaxScore' -d.loc[0, 'SID']=pd.NA +d.loc[0, "UserName"] = "_Max_Points_" +d.loc[0, "LastName"] = "MaxScore" +d.loc[0, "FirstName"] = "MaxScore" +d.loc[0, "SID"] = pd.NA -specialUsers=[] -specialUsers.append('_Max_Points_') +specialUsers = [] +specialUsers.append("_Max_Points_") # lets add row which will be in charge of the column type -d=pd.concat([d, pd.DataFrame({'UserName': ['_Col_Category_']}, columns=d.columns)], ignore_index=True) -specialUsers.append('_Col_Category_') +d = pd.concat( + [d, pd.DataFrame({"UserName": ["_Col_Category_"]}, columns=d.columns)], + ignore_index=True, +) +specialUsers.append("_Col_Category_") # cleanup # c = d.columns @@ -58,22 +61,24 @@ specialUsers.append('_Col_Category_') # d[index] = np.nan # TheExperTA last column contains 'Averages' per student which we do not need -d.drop(columns=['Averages'], inplace=True) +d.drop(columns=["Averages"], inplace=True) # TheExperTA last row contains Averages per assignment which we do not need -row = d[(d['LastName']=='Averages') & (d['FirstName'].isna()) & (d['UserName'].isna())] +row = d[ + (d["LastName"] == "Averages") & (d["FirstName"].isna()) & (d["UserName"].isna()) +] d.drop(row.index, inplace=True) # hand tuned fixes -d['UserName'].replace('@email.wm.edu$', '@wm.edu', regex=True, inplace=True) +d["UserName"].replace("@email.wm.edu$", "@wm.edu", regex=True, inplace=True) # d['UserName'].replace('phanng@hotmail.com@tj.va$', 'kphan@wm.edu', regex=True, inplace=True) # Now let's convert percentage which TheExperTA reports to points as GradeTable expects for c in d.columns: - if c in ['LastName', 'FirstName', 'UserName', 'SID']: + if c in ["LastName", "FirstName", "UserName", "SID"]: continue - maxP = d.loc[(d['UserName'] == '_Max_Points_')][c].values[0] - index = ~d['UserName'].isin( specialUsers ) - d.loc[index,c] *= maxP/100 # convert percentage to points + maxP = d.loc[(d["UserName"] == "_Max_Points_")][c].values[0] + index = ~d["UserName"].isin(specialUsers) + d.loc[index, c] *= maxP / 100 # convert percentage to points # TheExpertTA due to their percentage system generates +/- 0.0000001 scores # which is useless and make very long numbers in tables. @@ -81,15 +86,16 @@ for c in d.columns: d.loc[index, c] = d.loc[index, c].round(4) # now we are trying to guess column category - if 'hw' in c.lower(): - d.loc[(d['UserName'] == '_Col_Category_'), c] = 'HomeWork' + if "hw" in c.lower(): + d.loc[(d["UserName"] == "_Col_Category_"), c] = "HomeWork" -d.to_csv('TheExpertTA.csv', index=False) +d.to_csv("TheExpertTA.csv", index=False) # now import to sqlite3 -os.popen('rm -f TheExpertTA.db') -p = os.popen('printf ".mode csv\n.import \"TheExpertTA.csv\" export_table\n.q" | sqlite3 TheExpertTA.db') +os.popen("rm -f TheExpertTA.db") +p = os.popen( + 'printf ".mode csv\n.import "TheExpertTA.csv" export_table\n.q" | sqlite3 TheExpertTA.db' +) p.close() - diff --git a/regenWebAssign.py b/regenWebAssign.py index 007dc2d..18e9841 100755 --- a/regenWebAssign.py +++ b/regenWebAssign.py @@ -9,44 +9,51 @@ import os infile = sys.argv[1] f = open(infile) -l= f.readlines() -h= l[4] -maxPossible=l[6] +l = f.readlines() +h = l[4] +maxPossible = l[6] f.close() # clean up of headers -h=h.strip() -h = h.replace('"', '') -headers = h.split(',') -headers[0]='FullName' -headers[1]='UserName' -headers[2]='SID' -headers[3]='TotalPcnt' -headers[4]='TotalScore' - -d = pd.read_csv(infile, skiprows=[0,1,2,3,4,5,7,8], header=None, names=headers) -d.loc[0, 'FullName']='MaxScore' -d.loc[0, 'UserName']='MaxScore' +h = h.strip() +h = h.replace('"', "") +headers = h.split(",") +headers[0] = "FullName" +headers[1] = "UserName" +headers[2] = "SID" +headers[3] = "TotalPcnt" +headers[4] = "TotalScore" + +d = pd.read_csv(infile, skiprows=[0, 1, 2, 3, 4, 5, 7, 8], header=None, names=headers) +d.loc[0, "FullName"] = "MaxScore" +d.loc[0, "UserName"] = "MaxScore" # cleanup c = d.columns -c=c.drop(['FullName', 'UserName', 'SID']) -index = d[c] == 'ND' +c = c.drop(["FullName", "UserName", "SID"]) +index = d[c] == "ND" d[index] = np.nan -index = d[c] == 'NS' +index = d[c] == "NS" d[index] = np.nan -d['UserName'].replace('@wm$', '', regex=True, inplace=True) -d['UserName'].replace('@email.wm.edu$', '@wm.edu', regex=True, inplace=True) +d["UserName"].replace("@wm$", "", regex=True, inplace=True) +d["UserName"].replace("@email.wm.edu$", "@wm.edu", regex=True, inplace=True) # hand tuned fixes -d['UserName'].replace('phanng@hotmail.com@tj.va$', 'kphan@wm.edu', regex=True, inplace=True) -d['UserName'].replace('chipkd2001@gmail.com$', 'ckdangerio@wm.edu', regex=True, inplace=True) -d['UserName'].replace('eliasarivera@live.com@schs.va$', 'earivera@wm.edu', regex=True, inplace=True) - -d.to_csv('WebAssign.csv', index=False) +d["UserName"].replace( + "phanng@hotmail.com@tj.va$", "kphan@wm.edu", regex=True, inplace=True +) +d["UserName"].replace( + "chipkd2001@gmail.com$", "ckdangerio@wm.edu", regex=True, inplace=True +) +d["UserName"].replace( + "eliasarivera@live.com@schs.va$", "earivera@wm.edu", regex=True, inplace=True +) + +d.to_csv("WebAssign.csv", index=False) # now import to sqlite3 -os.popen('rm -f WebAssign.db') -p = os.popen('printf ".mode csv\n.import \"WebAssign.csv\" export_table\n.q" | sqlite3 WebAssign.db') +os.popen("rm -f WebAssign.db") +p = os.popen( + 'printf ".mode csv\n.import "WebAssign.csv" export_table\n.q" | sqlite3 WebAssign.db' +) p.close() - diff --git a/toBlackboardCSV.py b/toBlackboardCSV.py index 019158c..fdf16da 100755 --- a/toBlackboardCSV.py +++ b/toBlackboardCSV.py @@ -36,6 +36,16 @@ infoCol = [ ] dOut = dOut.drop(infoCol, axis=1) -fout = "BlackBoard.csv" +# drop non gradable columns +cCat = dIn["UserName"] == "_Col_Category_" +colToDrop = [] +for c in dOut.columns: + if c == "Username": + continue + category = dIn[cCat][c][0] + if category not in ["HomeWork", "MidTerm", "FinalExam", "weighted_column"]: + colToDrop.append(c) +dOut = dOut.drop(colToDrop, axis=1) + dOut.to_csv("BlackBoard.csv", index=False) print(f"Data was exported to {fout}") |