Improved positive_keywords and negative_keywords processing for the CLI · kingking888/python-readability@f7f439d · GitHub
[go: up one dir, main page]

Skip to content

Commit f7f439d

Browse files
committed
Improved positive_keywords and negative_keywords processing for the CLI
1 parent 0c8f040 commit f7f439d

File tree

1 file changed

+7
-8
lines changed

1 file changed

+7
-8
lines changed

readability/readability.py

Lines changed: 7 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -67,17 +67,16 @@ def text_length(i):
6767
def compile_pattern(elements):
6868
if not elements:
6969
return None
70+
elif isinstance(elements, regexp_type):
71+
return elements
7072
elif isinstance(elements, (str_, bytes_)):
7173
if isinstance(elements, bytes_):
7274
elements = str_(elements, 'utf-8')
7375
elements = elements.split(u',')
74-
return re.compile(u'|'.join([re.escape(x.lower()) for x in elements]), re.U)
75-
elif isinstance(elements, (list, tuple)):
76-
return list(elements)
77-
elif isinstance(elements, regexp_type):
78-
return elements
76+
if isinstance(elements, (list, tuple)):
77+
return re.compile(u'|'.join([re.escape(x.strip().lower()) for x in elements]), re.U)
7978
else:
80-
raise Exception("Unknown format for the pattern")
79+
raise Exception("Unknown type for the pattern: {}".format(type(elements)))
8180
# assume string or string like object
8281

8382
class Document:
@@ -614,8 +613,8 @@ def main():
614613
parser.add_option('-l', '--log', default=None, help="save logs into file (appended)")
615614
parser.add_option('-u', '--url', default=None, help="use URL instead of a local file")
616615
parser.add_option('-x', '--xpath', default=None, help="add original xpath")
617-
parser.add_option('-p', '--positive-keywords', default=None, help="positive keywords (separated with comma)", action='store')
618-
parser.add_option('-n', '--negative-keywords', default=None, help="negative keywords (separated with comma)", action='store')
616+
parser.add_option('-p', '--positive-keywords', default=None, help="positive keywords (comma-separated)", action='store')
617+
parser.add_option('-n', '--negative-keywords', default=None, help="negative keywords (comma-separated)", action='store')
619618
(options, args) = parser.parse_args()
620619

621620
if options.verbose:

0 commit comments

Comments
 (0)
0