From f8e482ed42eb5326cccec1ad92127774a068de33 Mon Sep 17 00:00:00 2001 From: Antonio Ospite Date: Sat, 26 Nov 2011 12:56:54 +0100 Subject: [PATCH 1/1] winfreed.py: use the file name from Content-Disposition if available Some servers provide a Content-Disposition header indicating the filename of the object being served; use it instead of the name in the URL when this information is available. --- winfreed.py | 13 ++++++++++++- 1 file changed, 12 insertions(+), 1 deletion(-) diff --git a/winfreed.py b/winfreed.py index 108b719..a53bda8 100755 --- a/winfreed.py +++ b/winfreed.py @@ -17,6 +17,7 @@ # You should have received a copy of the GNU General Public License # along with this program. If not, see <http://www.gnu.org/licenses/>. +import re import os import sys import glob @@ -67,7 +68,17 @@ def download(pkg): pass response = urllib2.urlopen(url) - filename = urllib2.unquote(os.path.basename(response.geturl())) + + filename = "" + if 'Content-Disposition' in response.info(): + # Use the filename the server tells us if any, + # re pattern from http://stackoverflow.com/questions/8035900 + content_disposition = response.info().getheader('Content-Disposition').strip() + filename = re.findall("filename=(\S+)", content_disposition)[0] + + if filename == "": + filename = urllib2.unquote(os.path.basename(response.geturl())) + if filename == "": sys.stderr.write("Debug (%s): filename: %s url: %s\n" %(pkg['package_name'], filename, response.geturl())) return -- 2.1.4