diff options
| author | David Oberhollenzer <david.oberhollenzer@sigma-star.at> | 2019-07-26 23:07:41 +0200 | 
|---|---|---|
| committer | David Oberhollenzer <david.oberhollenzer@sigma-star.at> | 2019-07-28 16:33:57 +0200 | 
| commit | cce36f459ddb5698fd1a40061c466996482146eb (patch) | |
| tree | 05037e8f8d18c850a2f8afeac427e3dcada717dc /tar | |
| parent | e480a7459377817fbab7029a7dad47c969b8dd97 (diff) | |
Implement fragment deduplication in data writer
The strategy is simple:
 - The data writer function that write data/fragment blocks get
   access to the list files.
 - When writing a fragment, we look for an already written file that has
   a fragment with the same size and checksum.
 - If we find one, we throw away the fragment and reuse the existing one.
Signed-off-by: David Oberhollenzer <david.oberhollenzer@sigma-star.at>
Diffstat (limited to 'tar')
| -rw-r--r-- | tar/tar2sqfs.c | 15 | 
1 files changed, 10 insertions, 5 deletions
diff --git a/tar/tar2sqfs.c b/tar/tar2sqfs.c index 625cec6..836df21 100644 --- a/tar/tar2sqfs.c +++ b/tar/tar2sqfs.c @@ -194,20 +194,20 @@ fail_arg:  }  static int write_file(tar_header_decoded_t *hdr, file_info_t *fi, -		      data_writer_t *data) +		      data_writer_t *data, file_info_t *list)  {  	int ret;  	if (hdr->sparse != NULL) {  		ret = write_data_from_fd_condensed(data, fi, STDIN_FILENO, -						   hdr->sparse, 0); +						   hdr->sparse, 0, list);  		if (ret)  			return -1;  		return skip_padding(STDIN_FILENO, hdr->record_size);  	} -	if (write_data_from_fd(data, fi, STDIN_FILENO, 0)) +	if (write_data_from_fd(data, fi, STDIN_FILENO, 0, list))  		return -1;  	return skip_padding(STDIN_FILENO, fi->size); @@ -259,8 +259,13 @@ static int create_node_and_repack_data(tar_header_decoded_t *hdr, fstree_t *fs,  			return -1;  	} -	if (S_ISREG(hdr->sb.st_mode)) -		return write_file(hdr, node->data.file, data); +	if (S_ISREG(hdr->sb.st_mode)) { +		if (write_file(hdr, node->data.file, data, fs->files)) +			return -1; + +		node->data.file->next = fs->files; +		fs->files = node->data.file; +	}  	return 0;  fail_errno:  | 
