diff --git a/crawler.py b/crawler.py index b4445be..e739ef6 100644 --- a/crawler.py +++ b/crawler.py @@ -82,7 +82,7 @@ def filteringcon(filters_regex_one): with open(filters_regex_one) as f: file = f.read().split('\n') for i in range(len(file)): - file[i] = re.sub('(..*#..*)|(@@\|\|..*)|(\|\|..*\/..*)|(^\/..*)|(^..*\$app=..*)|(^..*\$removeparam=..*)|(^..\/..*)|(\$..*)|(^\...*)|(^:..*)|(^\|http)|(^@@..*)|(^_..*)|(^\*..*)|(^&..*)|(^-..*)', '', file[i]) + file[i] = re.sub('(@@\|\|..*)|(\|\|..*\/..*)|(^\|http)|(^(_|\*|&|\-|\/|\.|:|@@|\?|\=|\;)..*)|(..*(#|\$)..*)|(^..*\$(app=|removeparam=)..*)|(\|\|..*\/..*)', '', file[i]) file[i] = re.sub('0\.0\.0\.0 0\.0\.0\.0\Z', '', file[i]) file[i] = re.sub('\A'+str(IP4)+' ', '', file[i]) file[i] = re.sub('\A'+str(IP6)+' ', '', file[i])