#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""Download every file linked from a web page into a local directory.

Usage:
    script PAGE_URL [DUMP_DIR]

The page at PAGE_URL is saved as ``index.html`` in the current directory,
scanned for protocol-relative links (``href="//host/path"``), and each
distinct link is fetched with ``wget`` into DUMP_DIR (default: ``dump``).

Requires the ``wget`` executable on PATH.
"""

import os
import re
import subprocess
import sys
from typing import List

INDEX_FILE = "index.html"
DEFAULT_DUMP_DIR = "dump"

# Captured links are protocol-relative ("//host/path"), so a scheme is
# prepended before they are handed to wget.
URL_SCHEME = "http:"

# NOTE(review): the pattern originally used here was lost (the script ended
# up with an empty regex, which made ``group(1)`` raise IndexError on the
# first line read).  This reconstruction captures the target of any anchor
# whose href is protocol-relative, which is the only shape compatible with
# the "http:" prefix added at download time.  Tighten it if the target site
# needs a more specific match.
LINK_PATTERN = re.compile(r'href="(//[^"]+)"')


def extract_links(html: str) -> List[str]:
    """Return the distinct protocol-relative links found in *html*.

    The markup is first cut after every ``</a>`` so that each anchor sits in
    its own segment; at most one link (the first match) is taken from each
    segment.  Links are returned in order of first appearance, without
    duplicates, so a file referenced by several anchors is fetched once.
    """
    links = {}
    for segment in html.replace("</a>", "</a>\n").splitlines():
        found = LINK_PATTERN.search(segment)
        if found:
            # A dict keeps insertion order and drops repeated links.
            links.setdefault(found.group(1), None)
    return list(links)


def run_wget(*args: str) -> bool:
    """Run ``wget -q`` with *args* and report whether it succeeded.

    Arguments are passed as a list (no shell involved), so URLs and paths
    containing spaces or shell metacharacters cannot inject commands.
    """
    try:
        return subprocess.call(["wget", "-q", *args]) == 0
    except OSError as err:
        # Typically: wget is not installed or not executable.
        print(f"cannot run wget: {err}", file=sys.stderr)
        return False


def main(argv: List[str]) -> int:
    """Fetch the page named in *argv* and download the files it links to.

    Args:
        argv: Command-line vector: program name, page URL, and an optional
            destination directory.

    Returns:
        Process exit status: 0 on completion, 1 if the page itself could
        not be fetched, 2 on a usage error.  Individual file download
        failures are reported on stderr but do not change the status.
    """
    if len(argv) < 2:
        prog = os.path.basename(argv[0]) if argv else "script"
        print(f"usage: {prog} PAGE_URL [DUMP_DIR]", file=sys.stderr)
        return 2

    page_url = argv[1]
    dump_dir = argv[2] if len(argv) >= 3 else DEFAULT_DUMP_DIR

    # "--" stops option parsing so a URL starting with "-" is not mistaken
    # for a wget flag.
    if not run_wget("-O", INDEX_FILE, "--", page_url):
        print(f"could not fetch {page_url}", file=sys.stderr)
        return 1

    os.makedirs(dump_dir, exist_ok=True)

    # Pages are not guaranteed to be valid UTF-8; undecodable bytes are
    # replaced rather than aborting the whole run.
    with open(INDEX_FILE, encoding="utf-8", errors="replace") as index:
        links = extract_links(index.read())

    for link in links:
        # The bare link line is kept because the script has always printed it.
        print(link)
        print("Téléchargement de : " + link)
        # -P saves straight into the dump directory, which also lets -N
        # (timestamping) skip files that are already up to date there.
        if not run_wget("-N", "-P", dump_dir, "--", URL_SCHEME + link):
            print(f"download failed: {link}", file=sys.stderr)

    return 0


if __name__ == "__main__":
    sys.exit(main(sys.argv))