Skip to content

Commit

Permalink
Merge pull request #1835 from TrellixVulnTeam/main
Browse files Browse the repository at this point in the history
  • Loading branch information
miguelgfierro authored Oct 27, 2022
2 parents e66bf99 + fb53363 commit d61ca14
Showing 1 changed file with 20 additions and 1 deletion.
21 changes: 20 additions & 1 deletion recommenders/datasets/criteo.py
Original file line number Diff line number Diff line change
Expand Up @@ -157,7 +157,26 @@ def extract_criteo(size, compressed_file, path=None):
extracted_dir = path

with tarfile.open(compressed_file) as tar:
tar.extractall(extracted_dir)
def is_within_directory(directory, target):
    """Return True if ``target`` is ``directory`` itself or lies beneath it.

    Both paths are made absolute (and normalised) before comparison, so
    ``..`` components in ``target`` are resolved lexically first.

    Args:
        directory (str): Directory that must contain ``target``.
        target (str): Path to check.

    Returns:
        bool: True when ``target`` is inside ``directory``, False otherwise.
    """
    abs_directory = os.path.abspath(directory)
    abs_target = os.path.abspath(target)

    # commonpath compares whole path components. commonprefix compares
    # character by character and would wrongly accept a sibling such as
    # "/data/foobar" as being inside "/data/foo".
    try:
        common = os.path.commonpath([abs_directory, abs_target])
    except ValueError:
        # Raised when the paths cannot share an ancestor (e.g. different
        # drives on Windows); such a target is outside the directory.
        return False

    return common == abs_directory

def safe_extract(tar, path=".", members=None, *, numeric_owner=False):
    """Extract ``tar`` into ``path`` after checking every member's name.

    Each member name in the archive is joined onto ``path`` and checked
    with ``is_within_directory``; extraction only happens when all of
    them pass.

    Args:
        tar: Open archive object providing ``getmembers`` and ``extractall``.
        path (str): Destination directory.
        members: Forwarded unchanged to ``tar.extractall``.
        numeric_owner (bool): Forwarded unchanged to ``tar.extractall``.

    Raises:
        Exception: If any member's joined path is not within ``path``.
    """
    # NOTE(review): only member names are inspected here; link targets of
    # symlink/hardlink members are not checked by this function.
    escapes_destination = any(
        not is_within_directory(path, os.path.join(path, entry.name))
        for entry in tar.getmembers()
    )
    if escapes_destination:
        raise Exception("Attempted Path Traversal in Tar File")

    tar.extractall(path, members, numeric_owner=numeric_owner)


safe_extract(tar, extracted_dir)

filename_selector = {"sample": "dac_sample.txt", "full": "train.txt"}
return os.path.join(extracted_dir, filename_selector[size])
Expand Down

0 comments on commit d61ca14

Please sign in to comment.