Revision: 1837
Updated Code
at November 9, 2006 23:57 by whitetiger
Updated Code
"""Print the http...zip URLs found inside <a href=...> tags of an HTML file.

Usage: python script.py file.html
"""
import os  # no longer used by this script; import retained deliberately
import re
import sys

# An anchor tag carrying an href attribute.  The pattern is greedy, so on a
# line holding several tags the match runs up to the last '>' on that line.
ANCHOR_RE = re.compile('[<].?[Aa].*[Hh][Rr][Ee][Ff].*=.*[\"\']?.*[\"\']?.?[>]')

# An http URL ending in "zip" (any letter case).  The URL body excludes
# whitespace, quotes and angle brackets so a match stays inside one attribute
# value.  The earlier pattern 'http:-*zip' only allowed hyphens between
# "http:" and "zip" and therefore could not match a real URL.
ZIP_URL_RE = re.compile(r'''http:[^\s"'<>]*[Zz][Ii][Pp]''')


def find_zip_links(lines):
    """Yield every zip URL found inside anchor tags of the given lines.

    lines -- any iterable of strings (an open text file works).

    Lines without an <a ... href=...> tag are skipped; within a matching
    line every zip URL is reported, in order of appearance.
    """
    for line in lines:
        anchor = ANCHOR_RE.search(line)
        if anchor is None:
            continue
        for url in ZIP_URL_RE.findall(anchor.group(0)):
            yield url


def main(argv=None):
    """Print the zip links of the file named in argv[1], then 'FATTO'.

    argv -- argument list; defaults to sys.argv.

    Returns the process exit status: 0 on success, 2 when the file
    argument is missing.
    """
    if argv is None:
        argv = sys.argv
    if len(argv) < 2:
        sys.stderr.write('usage: python script.py file.html\n')
        return 2
    # Iterating the file stops cleanly at end-of-file; counting bytes from
    # os.stat against len(line) could loop forever when the two disagree
    # (newline translation, multi-byte characters).  'with' closes the file.
    with open(argv[1], 'r') as html:
        for url in find_zip_links(html):
            print(url)
    print('FATTO')
    return 0


if __name__ == '__main__':
    sys.exit(main())
Revision: 1836
Initial Code
Initial URL
Initial Description
Initial Title
Initial Tags
Initial Language
at November 9, 2006 23:55 by whitetiger
Initial Code
"""Print the http...zip URLs found inside <a href=...> tags of an HTML file.

Usage: python script.py file.html
"""
import os  # no longer used by this script; import retained deliberately
import re
import sys

# An anchor tag carrying an href attribute.  The pattern is greedy, so on a
# line holding several tags the match runs up to the last '>' on that line.
ANCHOR_RE = re.compile('[<].?[Aa].*[Hh][Rr][Ee][Ff].*=.*[\"\']?.*[\"\']?.?[>]')

# An http URL ending in "zip" (any letter case).  The URL body excludes
# whitespace, quotes and angle brackets so a match stays inside one attribute
# value.  The earlier pattern 'http:-*zip' only allowed hyphens between
# "http:" and "zip" and therefore could not match a real URL.
ZIP_URL_RE = re.compile(r'''http:[^\s"'<>]*[Zz][Ii][Pp]''')


def find_zip_links(lines):
    """Yield every zip URL found inside anchor tags of the given lines.

    lines -- any iterable of strings (an open text file works).

    Lines without an <a ... href=...> tag are skipped; within a matching
    line every zip URL is reported, in order of appearance.
    """
    for line in lines:
        anchor = ANCHOR_RE.search(line)
        if anchor is None:
            continue
        for url in ZIP_URL_RE.findall(anchor.group(0)):
            yield url


def main(argv=None):
    """Print the zip links of the file named in argv[1], then 'FATTO'.

    argv -- argument list; defaults to sys.argv.

    Returns the process exit status: 0 on success, 2 when the file
    argument is missing.
    """
    if argv is None:
        argv = sys.argv
    if len(argv) < 2:
        sys.stderr.write('usage: python script.py file.html\n')
        return 2
    # Iterating the file stops cleanly at end-of-file; counting bytes from
    # os.stat against len(line) could loop forever when the two disagree
    # (newline translation, multi-byte characters).  'with' closes the file.
    with open(argv[1], 'r') as html:
        for url in find_zip_links(html):
            print(url)
    print('FATTO')
    return 0


if __name__ == '__main__':
    sys.exit(main())
Initial URL
Initial Description
Initial Title
Python - Cattura tutti i links <a href=
Initial Tags
regex, python
Initial Language
Python