from bs4 import BeautifulSoup
import httpx


class RedditComments:
    """Download a page and format the comments found on it.

    Judging by the class name the page is expected to be a Reddit thread;
    the code itself only looks for ``<div>`` elements whose CSS class is
    ``Comment``.

    Attributes are documented inline in ``__init__``.
    """

    def __init__(self, link):
        """Fetch *link* and collect its comment elements.

        Args:
            link: URL of the page to download.
        """
        # NOTE(review): the response status is not checked here, and recent
        # httpx versions do not follow redirects unless asked to, so an
        # error or redirect response would be parsed as if it were the
        # thread page -- confirm this is acceptable for the callers.
        page = httpx.get(link)
        content = page.text

        # Name the parser explicitly. Without it Beautiful Soup emits a
        # warning and picks whichever parser happens to be installed, so the
        # resulting tree could differ from one machine to another.
        # "html.parser" ships with Python and is always available.
        self.soup = BeautifulSoup(content, "html.parser")

        # Every <div> carrying the CSS class "Comment".
        self.commentObjects = self.soup.find_all("div", "Comment")

        # Formatted comment strings; filled in by getComments().
        self.comments = []

    def getHeader(self, commentObj):
        """Return ``"<username> <date>"`` for one comment element.

        The username is the third ``/``-separated piece of the first
        anchor's ``href`` and the date is the text of the second anchor.
        This presumably relies on the first link being a relative profile
        URL such as ``/user/<name>/`` -- verify against the live markup.

        Args:
            commentObj: Element to read; it must offer ``find_all``.

        Returns:
            The username and the date joined by a single space.

        Raises:
            IndexError: Fewer than two anchors were found, or the ``href``
                has fewer than three ``/``-separated pieces.
            KeyError: The first anchor has no ``href`` attribute.
        """
        anchors = commentObj.find_all("a")
        username = anchors[0]["href"].split("/")[2]
        date = anchors[1].text
        return f"{username} {date}"

    def getText(self, commentObj):
        """Return the text of the first ``<p>`` in *commentObj*.

        Args:
            commentObj: Element to read; it must offer ``find``.

        Returns:
            The paragraph text, or ``""`` when there is no ``<p>``.
        """
        paragraph = commentObj.find("p")
        return "" if paragraph is None else paragraph.text

    def getComments(self):
        """Format every collected comment into ``self.comments``.

        Each entry is the header, a newline, the comment text and a final
        newline.  The list is rebuilt on every call, so calling this method
        more than once no longer appends duplicate entries.

        Returns:
            ``self.comments``, the list of formatted strings.
        """
        formatted = [
            f"{self.getHeader(co)}\n{self.getText(co)}\n"
            for co in self.commentObjects
        ]
        # Replace the contents in place so that references to the list
        # obtained before this call keep pointing at the current data.
        self.comments[:] = formatted
        return self.comments