I really don’t understand about python compression because whenever I am trying to compress a folder or file I end up getting a very larger file 5.5 times bigger than the original file. Why does this happen? Is there any way I can compress a folder or a file with python and get an output that’s at most the size of the original file? Here is the code I am using.
JavaScript
x
22
22
1
import os, zipfile
2
3
def zipfiles(filename, destname):
4
try:
5
zf = zipfile.ZipFile(destname, 'w', zipfile.ZIP_DEFLATED)
6
for dirname, subdirs, files in os.walk(filename):
7
zf.write(dirname)
8
for filename in files:
9
zf.write(os.path.join(dirname, filename))
10
zf.close()
11
except Exception, e:
12
print str(e)
13
def main():
14
x = raw_input('Enter Filename: ')
15
while len(x) == 0:
16
x = raw_input('Enter Filename: ')
17
y = raw_input('Enter destination name: ')
18
while len(y) == 0:
19
y = raw_input('Enter destination name: ')
20
zipfiles(x, y+'.zip')
21
main()
22
Advertisement
Answer
Make sure that the destination .zip
file is not in the same folder you are compressing, otherwise your script may be adding a copy of the file being created to itself — which obviously will make it much bigger.
Here’s a revised version of your code that will skip the archive when it’s being created in the same directory folder:
JavaScript
1
27
27
1
import os, zipfile
2
3
def zipfiles(source_folder, destination_name):
4
source_folder = os.path.abspath(source_folder)
5
destination_path = os.path.abspath(destination_name)
6
try:
7
with zipfile.ZipFile(destination_name, 'w', zipfile.ZIP_DEFLATED) as zf:
8
for dirname, subdirs, files in os.walk(source_folder):
9
# zf.write(dirname) # Not needed.
10
for filename in files:
11
filepath = os.path.join(dirname, filename)
12
if filepath != destination_path: # Skip file being created.
13
zf.write(filepath)
14
except Exception as e:
15
print(e)
16
17
def main():
18
x = ''
19
while not x:
20
x = raw_input('Enter source folder name: ')
21
y = ''
22
while not y:
23
y = raw_input('Enter destination archive file name: ')
24
zipfiles(x, y+'.zip')
25
26
main()
27