#!/usr/bin/python
# -*- coding: utf-8 -*-
"""Download every file linked from a web page into a local directory.

Usage::

    script URL [DUMP_DIR]

The page at URL is fetched with ``wget`` into a temporary file, scanned for
anchors that carry a protocol-relative ``href`` (``//host/path``), and each
such target is downloaded with ``wget`` into DUMP_DIR (default: ``dump``).
"""
import os
import re
import subprocess
import sys
import tempfile

DEFAULT_DUMP_DIR = "dump"

# NOTE(review): the pattern in the original script was an empty string, so
# ``group(1)`` did not exist and the first matching line raised IndexError.
# This pattern is a reconstruction inferred from how the captured text is
# used below ("http:" is prepended to it, so it must be a protocol-relative
# URL found inside an anchor). Confirm it against the markup of the pages
# this script is meant to scrape.
LINK_PATTERN = re.compile(r'<a\b[^>]*\shref="(//[^"]+)"')


def iter_links(html):
    """Yield each distinct protocol-relative link found in *html*, in order.

    The text is split after every ``</a>`` so that at most one link is taken
    per anchor, which mirrors the line-by-line search the script has always
    performed. A link that appears several times is yielded only once.
    """
    seen = set()
    for line in html.replace("</a>", "</a>\n").splitlines():
        match = LINK_PATTERN.search(line)
        if match is None:
            continue
        link = match.group(1)
        if link not in seen:
            seen.add(link)
            yield link


def run_wget(*args):
    """Run ``wget -q`` with *args* and return its exit status.

    Arguments are passed as a list (no shell), so URLs and paths containing
    shell metacharacters cannot inject commands. Returns 127 when ``wget``
    cannot be started at all.
    """
    try:
        return subprocess.call(["wget", "-q"] + list(args))
    except OSError as err:
        sys.stderr.write("wget could not be started: {0}\n".format(err))
        return 127


def main(argv=None):
    """Entry point; return the process exit status.

    *argv* is the argument list without the program name (defaults to
    ``sys.argv[1:]``): the page URL, optionally followed by the dump
    directory. Returns 2 on a usage error, 1 if the page or any linked file
    could not be downloaded, and 0 otherwise.
    """
    args = sys.argv[1:] if argv is None else list(argv)
    if not args:
        sys.stderr.write("usage: URL [DUMP_DIR]\n")
        return 2

    page_url = args[0]
    dump_dir = args[1] if len(args) >= 2 else DEFAULT_DUMP_DIR
    os.makedirs(dump_dir, exist_ok=True)

    # mkstemp hands back an open descriptor; close it right away because
    # wget writes to the path, and remove the file even if something fails.
    fd, page_path = tempfile.mkstemp()
    os.close(fd)
    try:
        # "--" keeps a URL that starts with "-" from being read as an option.
        if run_wget("-O", page_path, "--", page_url) != 0:
            sys.stderr.write("could not fetch {0}\n".format(page_url))
            return 1
        # Pages are not guaranteed to be valid UTF-8; undecodable bytes must
        # not abort the scan, since only ASCII markup is matched.
        with open(page_path, encoding="utf-8", errors="replace") as page:
            html = page.read()
    finally:
        os.remove(page_path)

    failures = 0
    for link in iter_links(html):
        print("Téléchargement de : " + link)
        # -P saves straight into dump_dir, so -N can compare timestamps with
        # a previously downloaded copy instead of always re-fetching.
        if run_wget("-N", "-P", dump_dir, "--", "http:" + link) != 0:
            sys.stderr.write("download failed: {0}\n".format(link))
            failures += 1
    return 1 if failures else 0


if __name__ == "__main__":
    sys.exit(main())