Skip to content

Commit

Permalink
Quick RSS fix
Browse files (browse the repository at this point in the history)
  • Loading branch information
battleoverflow committed Nov 1, 2023
1 parent 8c8481b commit 1ed237e
Showing 1 changed file with 11 additions and 10 deletions.
21 changes: 11 additions & 10 deletions threatingestor/sources/rss.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -54,16 +54,17 @@ def run(self, saved_state):
rss_exclude = re.sub(re.compile(fr"{self.exclude}", re.IGNORECASE), "", str(item.get('link')))

if rss_exclude:
if self.feed_type == "afterioc":
text = soup.get_text(separator=' ').split('Indicators of Compromise')[-1]
artifacts += self.process_element(text, item.get('link'), include_nonobfuscated=True)
elif self.feed_type == "clean":
text = soup.get_text(separator=' ')
artifacts += self.process_element(text, item.get('link'), include_nonobfuscated=True)
else:
# Default: self.feed_type == 'messy'.
text = soup.get_text(separator=' ')
artifacts += self.process_element(text, item.get('link'))
if "http" in rss_exclude:
if self.feed_type == "afterioc":
text = soup.get_text(separator=' ').split('Indicators of Compromise')[-1]
artifacts += self.process_element(text, item.get('link'), include_nonobfuscated=True)
elif self.feed_type == "clean":
text = soup.get_text(separator=' ')
artifacts += self.process_element(text, item.get('link'), include_nonobfuscated=True)
else:
# Default: self.feed_type == 'messy'.
text = soup.get_text(separator=' ')
artifacts += self.process_element(text, item.get('link'))

if self.include is not None:
rss_include = re.compile(r"{0}".format(self.include)).findall(str(self.include.split('|')))
Expand Down

0 comments on commit 1ed237e

Please sign in to comment.