| 1 |
"""
|
| 2 |
|
| 3 |
SF-SubjectLineDeconstructor
|
| 4 |
|
| 5 |
Created by:
|
| 6 |
Emanuel Borges
|
| 7 |
09.21.2023
|
| 8 |
|
| 9 |
Very simple program that reads a list of subject lines and deconstructs them to consolidate them into a list that attorneys
|
| 10 |
can use to pull out responsive terms.
|
| 11 |
|
| 12 |
"""
|
| 13 |
|
| 14 |
def ProcessLine(line, removalList):
    """Strip every leading removal prefix from a subject line.

    The line is trimmed of surrounding whitespace, then any prefix from
    ``removalList`` found at the start is removed. This repeats until the
    line no longer starts with any of the prefixes, so stacked prefixes
    such as ``"RE: FW: [EXTERNAL] Budget"`` are fully removed in one call.
    Matching is case-sensitive and only applies at the start of the line.

    Args:
        line: The raw subject line.
        removalList: Iterable of prefix strings to remove. Empty strings
            are ignored.

    Returns:
        The subject line with leading prefixes and surrounding whitespace
        removed.
    """
    # An empty prefix matches every string, which would keep the loop
    # below from ever terminating, so such entries are dropped up front.
    prefixes = tuple(prefix for prefix in removalList if prefix)

    line = line.strip()
    removedPrefix = True
    while removedPrefix:
        removedPrefix = False
        for begVal in prefixes:
            if line.startswith(begVal):
                # Slice the prefix off and re-trim so the next prefix is
                # tested against the real start of the remaining text.
                line = line[len(begVal):].strip()
                removedPrefix = True
    return line
|
| 20 |
|
| 21 |
|
| 22 |
if __name__ == '__main__':
    # Script entry point: read raw subject lines, remove reply/forward/
    # calendar/external-tag prefixes, de-duplicate, and write the sorted
    # unique subjects to the output file, one per line.
    removalList = ['[EXTERNAL] ', 'RE: ', 'FW: ','Accepted: ','Canceled: ','Tentative: ', 'Re: ', 'Fw: ', 'Fwd: ', 'Automatic reply: ', 'Declined: ', '[EXTERNAL EMAIL] ']
    # str.startswith accepts a tuple, so one call tests every prefix.
    removalPrefixes = tuple(removalList)

    sfInputFileName = r"C:\Users\eborges\Documents\Cases\State Farm\subject_line_raw.txt"
    outputFileName = r"C:\Users\eborges\Documents\Cases\State Farm\subject_line_EB.txt"

    sfSubjectSet = set()

    # NOTE(review): both files are opened with the platform default
    # encoding -- confirm that matches how the subject list was exported.
    with open(sfInputFileName) as inputFile:
        contents = inputFile.readlines()
    print(f"This file contains {len(contents)} lines.")

    for line in contents:
        # Trim every line, not just the prefixed ones, so subjects that
        # differ only by surrounding whitespace collapse to one entry.
        line = line.strip()
        # Prefixes can be stacked (e.g. "RE: FW: ..."), so keep calling
        # ProcessLine until none of them remains at the start.
        while line.startswith(removalPrefixes):
            line = ProcessLine(line, removalList)
        sfSubjectSet.add(line)

    # The with-block closes the output file even if a write fails.
    with open(outputFileName, 'w') as outputFile:
        outputFile.writelines(f"{subject}\n" for subject in sorted(sfSubjectSet))