From 05ba1d01f6dec6bc6d44f57cdb3b4b6bc50ead23 Mon Sep 17 00:00:00 2001
From: khuxkm
Date: Fri, 3 Aug 2018 01:26:39 -0400
Subject: [PATCH] Text file name normalizer now removes punctuation from titles

---
 transgrab.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/transgrab.py b/transgrab.py
index 20bae09..81ea442 100644
--- a/transgrab.py
+++ b/transgrab.py
@@ -1,4 +1,4 @@
-import requests, re
+import requests, re, string
 from jsonpath import jsonpath
 from urllib.parse import quote as raw_quote
 import argparse
@@ -29,7 +29,7 @@ def processTranscript(r,dir_style=1):
     return "\n".join(text)
 
 def normalize(t):
-    return t.lower().replace(" ","_")
+    return "".join(filter(lambda x: not x in string.punctuation,t.lower())).replace(" ","_")
 
 if __name__=="__main__":
     parser = argparse.ArgumentParser(description="Grabs transcripts.")