summary |
shortlog |
log |
commit | commitdiff |
tree
raw |
patch |
inline | side by side (from parent 1: 1d965dd)
Some servers provide a Content-Disposition header that indicates the
filename of the object served. Use this filename instead of the name in
the URL if this information is available.
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
import os
import sys
import glob
import os
import sys
import glob
pass
response = urllib2.urlopen(url)
pass
response = urllib2.urlopen(url)
- filename = urllib2.unquote(os.path.basename(response.geturl()))
+
+ filename = ""
+ if 'Content-Disposition' in response.info():
+ # Use the filename the server tells us if any,
+ # re pattern from http://stackoverflow.com/questions/8035900
+ content_disposition = response.info().getheader('Content-Disposition').strip()
+ filename = re.findall("filename=(\S+)", content_disposition)[0]
+
+ if filename == "":
+ filename = urllib2.unquote(os.path.basename(response.geturl()))
+
if filename == "":
sys.stderr.write("Debug (%s): filename: %s url: %s\n" %(pkg['package_name'], filename, response.geturl()))
return
if filename == "":
sys.stderr.write("Debug (%s): filename: %s url: %s\n" %(pkg['package_name'], filename, response.geturl()))
return