diff --git a/consensus_and_scoring/TriagerScoring.py b/consensus_and_scoring/TriagerScoring.py index b2f1cdc..908d767 100644 --- a/consensus_and_scoring/TriagerScoring.py +++ b/consensus_and_scoring/TriagerScoring.py @@ -43,7 +43,7 @@ def importData(path, out_path): #redundancy = art_data[''] length = art_data['article_text_length'].iloc[0] #print(length) - source_text = makeList(length) + source_text = makeList(length + 1) #flagExclusions = exclusionList(users, flags, cats) flagExclusions = [] #print(flagExclusions) @@ -225,6 +225,11 @@ def determinePassingIndices(starts, ends, numUsers, users, length, category): 'passingFunc': evalThresholdMatrix, 'scale': 1.8 }, + 'Junk Text': + { + 'passingFunc': ignoreThis, + 'scale': 0 + } } passFunc = actionDeterminant[category]['passingFunc'] scale = actionDeterminant[category]['scale'] @@ -245,6 +250,9 @@ def findPassingIndices(starts, ends, numUsers, users, length, passingFunc = eval passersArray[i] = 1 return passersArray +def ignoreThis(percent, TotalNumUsers, scale): + return 'X' + def minPercent(percent, totalNumUsers, scale): if percent>=scale: return 'H' @@ -354,6 +362,7 @@ def addToSourceText(starts, ends, texts, sourceText): sourceText[c] = texts[i][pointer] pointer +=1 return sourceText + def makeList(size): out = [] for i in range(size): @@ -363,7 +372,8 @@ def makeList(size): def getText(start,end, sourceText): out = '' for i in range(int(start),int(end)): - out = out+sourceText[i] + if i < len(sourceText) - 1: + out = out+ str(sourceText[i]) return out