Revision: 6505
Initial Code
Initial URL
Initial Description
Initial Title
Initial Tags
Initial Language
at May 25, 2008 14:02 by abhiomkar
Initial Code
#!/usr/bin/python
"""Generate a youtube-dl batch script from the video links on a web page.

Usage: pass the page URL as the first command-line argument.  Every
``<a href="/watch?v=...">`` link on that page becomes one
``youtube-dl -t <url>`` line in a file named ``youtube_links`` in the
current directory.
"""

import sys
from contextlib import closing

# sgmllib only ships with Python 2; fall back to html.parser where it is
# missing so the script keeps working on Python 3.
try:
    from sgmllib import SGMLParser as _ParserBase
    _HAVE_SGMLLIB = True
except ImportError:
    from html.parser import HTMLParser as _ParserBase
    _HAVE_SGMLLIB = False

try:
    from urllib.request import urlopen  # Python 3
except ImportError:
    from urllib import urlopen  # Python 2

try:
    from shlex import quote as _shell_quote  # Python 3.3+
except ImportError:
    from pipes import quote as _shell_quote  # Python 2

_WATCH_PREFIX = "/watch?v="
_SITE_ROOT = "http://youtube.com"
_COMMAND = "youtube-dl -t "
_OUTPUT_FILE = "youtube_links"


class MyParser(_ParserBase):
    """A simple parser that collects download commands for video links."""

    def __init__(self, verbose=0):
        """Initialise the parser.

        'verbose' is forwarded to the superclass when that is sgmllib's
        SGMLParser; the html.parser fallback has no such option, so it is
        ignored there.
        """
        if _HAVE_SGMLLIB:
            _ParserBase.__init__(self, verbose)
        else:
            _ParserBase.__init__(self)
        self.hyperlinks = []

    def parse(self, s):
        """Parse the given string 's' and finish the parser.

        Byte strings are decoded first where the text type differs from
        bytes (Python 3), because html.parser only accepts text.
        """
        if isinstance(s, bytes) and not isinstance(s, str):
            s = s.decode("utf-8", "replace")
        self.feed(s)
        self.close()

    if not _HAVE_SGMLLIB:
        def handle_starttag(self, tag, attrs):
            """Route <a> tags to start_a, as SGMLParser does by itself."""
            if tag == "a":
                self.start_a(attrs)

    def start_a(self, attributes):
        """Process a hyperlink and its 'attributes'.

        For every href that starts with "/watch?v=", append a youtube-dl
        command line to self.hyperlinks.
        """
        for name, value in attributes:
            # html.parser reports a valueless attribute as None.
            if name != "href" or not value:
                continue
            if value.startswith(_WATCH_PREFIX):
                # The href comes from an untrusted page and ends up in a
                # shell script: quote it so '&', ';', '?' and friends are
                # not interpreted by the shell.
                self.hyperlinks.append(
                    _COMMAND + _shell_quote(_SITE_ROOT + value))

    def get_hyperlinks(self):
        """Return the list of collected command lines."""
        return self.hyperlinks


def f2(seq):
    """Return the items of 'seq' without duplicates, keeping first-seen order.

    Membership is tested against a list rather than a set so that
    unhashable items remain supported.
    """
    checked = []
    for e in seq:
        if e not in checked:
            checked.append(e)
    return checked


def main(argv=None):
    """Fetch the page named in argv[1] and write the batch script.

    Returns 0 on success and 2 when no URL was supplied.
    """
    argv = sys.argv if argv is None else argv
    if len(argv) < 2:
        prog = argv[0] if argv else "youtube_links.py"
        sys.stderr.write("usage: %s <page-url>\n" % prog)
        return 2

    # closing() works for both Python 2 and Python 3 urlopen results.
    with closing(urlopen(argv[1])) as response:
        page = response.read()

    myparser = MyParser()
    myparser.parse(page)

    # De-duplicate once and reuse the result for both outputs.
    links = f2(myparser.get_hyperlinks())
    print(links)

    with open(_OUTPUT_FILE, "w") as yt:
        yt.writelines(link + "\n" for link in links)

    print("\nYouTube Batch Download Script \"youtube_links\" has been generated. Execute it !")
    return 0


if __name__ == "__main__":
    sys.exit(main())
Initial URL
Initial Description
You
Initial Title
YouTube Batch Download Script
Initial Tags
python, download
Initial Language
Python