# normalize() as it reads after the transgrab.py change 20bae09..81ea442.
# That change also adds `string` to the module's imports, which this
# function depends on.
import string

# Built once at import time: maps each space to "_" and deletes every ASCII
# punctuation character. Deletion and substitution happen in the same pass,
# so an underscore already present in the input is removed (it is part of
# string.punctuation) while underscores produced from spaces are kept.
_NORMALIZE_TABLE = str.maketrans(" ", "_", string.punctuation)


def normalize(t):
    """Return a lowercase, punctuation-free, underscore-separated form of *t*.

    The text is lowercased, every character found in ``string.punctuation``
    (ASCII punctuation only) is dropped, and each space becomes ``_``.
    Consecutive spaces are not collapsed, and whitespace other than the
    space character is left untouched.

    Args:
        t: The string to normalize.

    Returns:
        The normalized string; an empty input yields an empty string.
    """
    return t.lower().translate(_NORMALIZE_TABLE)