diff --git a/export.py b/export.py index 15f937a..b10aab0 100644 --- a/export.py +++ b/export.py @@ -42,6 +42,8 @@ class MyHTMLParser(HTMLParser): self.captions = [] self.title = "" self.description = "" + self.inittitle = "" + self.initdescription = "" def check_attr(self, attrs, attr, value): @@ -63,6 +65,10 @@ class MyHTMLParser(HTMLParser): self.captions[len(self.captions)-1]["endTime"] = int(self.get_attr(attrs, "data-end-ms")) elif tag == "input" and self.check_attr(attrs, "id", "metadata-title"): self.title = self.get_attr(attrs, "value") + elif tag == "textarea" and self.check_attr(attrs, "id", "metadata-description"): + self.initdescription = self.get_attr(attrs, "data-original-description") + elif tag == "input" and self.check_attr(attrs, "id", "metadata-title"): + self.inittitle = self.get_attr(attrs, "data-original-title") def handle_data(self, data): if self.get_starttag_text() and self.get_starttag_text().startswith("