vlang
diff --git a/‎examples/archive/tar_gz_reader.v‎
Lines changed: 166 additions & 0 deletions b/‎examples/archive/tar_gz_reader.v‎
Lines changed: 166 additions & 0 deletions
diff --git a/‎vlib/archive/README.md‎
Lines changed: 3 additions & 0 deletions b/‎vlib/archive/README.md‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎vlib/archive/tar/README.md‎
Lines changed: 33 additions & 0 deletions b/‎vlib/archive/tar/README.md‎
Lines changed: 33 additions & 0 deletions
@@ -0,0 +1,166 @@
+import archive.tar
+import flag
+import net.http
+import os
+import term
+
+const default_url = 'https://github.com/vlang/v/archive/refs/tags/v0.1.3.tar.gz'
+
+// Context holds the command line options that drive one run of this example.
+// It is filled once by `new_context` and then only read.
+@[heap]
+struct Context {
+	url        string // Web starting with http:// or https://. Local starting with file:/// (resolved relative to the home directory)
+	chunks     bool   // true: decompress with callback
+	debug      int    // print debug lines; higher values print more block kinds (0 is silent)
+	max_blocks int    // if max_blocks > 0 and is reached stops early.
+	filename   string // if filename is found as a path of a data block, stops early.
+}
+
+// read_last_block reports whether the configured block limit has been passed.
+// When `max_blocks` is positive and smaller than the current block number,
+// it sets `read.stop_early` and returns true. Otherwise it returns false and
+// leaves `read` untouched.
+fn (ctx &Context) read_last_block(mut read tar.Read) bool {
+	limit_passed := ctx.max_blocks > 0 && ctx.max_blocks < read.get_block_number()
+	if limit_passed {
+		read.stop_early = true
+	}
+	return limit_passed
+}
+
+// new_context parses `os.args` into a heap allocated Context.
+// Arguments that the flag parser does not consume are printed, not rejected.
+// Returns the error of `finalize()` when the command line cannot be parsed.
+fn new_context() !&Context {
+	mut parser := flag.new_flag_parser(os.args)
+	parser.application('tar_gz_reader')
+	parser.version('0.0.20250721')
+	parser.description('Reads into memory selected sections of *.tar.gz. archives from https or home_dir.')
+	parser.skip_executable()
+	// The flags are registered in the same order as the Context fields.
+	url := parser.string('url', `u`, default_url, 'archive *.tar.gz URL, default(${default_url}). Start name with file:/// for local')
+	chunks := parser.bool('chunks', `c`, false, 'decompress with chunks to reduce RAM usage, default(false)')
+	debug := parser.int('debug', `d`, 0, 'prints blocks: 1=other, 2:+dirs, 3=+files, 4=+data, default(0=silent)')
+	max_blocks := parser.int('max_blocks', `m`, 0, 'maximum blocks to read, stop early. Default(0=read all)')
+	filename := parser.string('filename', `f`, '', 'filename content complete print, stop early. Default(empty means none)')
+	leftover := parser.finalize()!
+	if leftover.len > 0 {
+		println('unprocessed args ${leftover.join_lines()}')
+	}
+	return &Context{
+		url:        url
+		chunks:     chunks
+		debug:      debug
+		max_blocks: max_blocks
+		filename:   filename
+	}
+}
+
+// Downloader keeps the bytes of a *.tar.gz archive in memory.
+// For web URLs it is handed to `http.download_file_with_progress` as the
+// `downloader` of `http.DownloaderParams`, and `on_chunk` appends the received chunks.
+struct Downloader {
+mut:
+	chunks int  // number of chunks appended by `on_chunk`
+	data   []u8 // the archive bytes collected so far
+}
+
+// new_downloader loads the archive addressed by `url` fully into memory.
+// - `http://` and `https://` URLs are fetched with `http.download_file_with_progress`,
+//   passing the new Downloader as the `downloader` of the params.
+// - `file:///` URLs are read from disk; the part after the prefix is resolved
+//   relative to the user's home directory.
+// Returns an error when the download or the file read fails, and also when the
+// URL uses any other prefix, so that an unsupported URL is reported here instead
+// of surfacing later as a decompression failure on empty data.
+fn new_downloader(url string) !&Downloader {
+	mut downloader := &Downloader{}
+	if url.starts_with('http://') || url.starts_with('https://') {
+		params := http.DownloaderParams{
+			downloader: downloader
+		}
+		http.download_file_with_progress(url, '', params)!
+	} else if url.starts_with('file:///') {
+		// 8 is the length of the `file:///` prefix
+		path := '${os.home_dir()}/${url[8..]}'
+		println('path ${path}')
+		downloader.data = os.read_bytes(path)!
+	} else {
+		return error('unsupported url `${url}`: it must start with http://, https:// or file:///')
+	}
+	return downloader
+}
+
+// on_start intentionally does nothing: the Downloader needs no preparation.
+// NOTE(review): presumably required by the downloader interface of `net.http` - confirm.
+fn (mut d Downloader) on_start(mut request http.Request, path string) ! {}
+
+// on_chunk appends `chunk` to the collected data and counts it.
+// Chunks reported with an `expected` size of 0 are skipped.
+fn (mut d Downloader) on_chunk(request &http.Request, chunk []u8, already_received u64, expected u64) ! {
+	if expected != 0 {
+		d.chunks++
+		d.data << chunk
+	}
+}
+
+// on_finish intentionally does nothing: the data is already complete in `d.data`.
+// NOTE(review): presumably required by the downloader interface of `net.http` - confirm.
+fn (mut d Downloader) on_finish(request &http.Request, response &http.Response) ! {}
+
+// FileReader implements `tar.Reader`. Depending on the debug level of its
+// context it prints the blocks it is given, and it collects the content of
+// the first file whose path ends with `ctx.filename`.
+struct FileReader implements tar.Reader {
+	ctx &Context // options that control printing and early stop
+mut:
+	filepath string // path of the matched file, set by `file_block`; empty until a match
+	content  []u8   // data of the matched file, appended by `data_block`
+}
+
+// new_file_reader returns a FileReader bound to `ctx`, with no file matched yet.
+fn new_file_reader(ctx &Context) FileReader {
+	reader := FileReader{
+		ctx: ctx
+	}
+	return reader
+}
+
+// other_block handles a block that is neither a directory, a file nor data.
+// It first applies the block limit, then prints the block when debug > 0.
+fn (mut f FileReader) other_block(mut read tar.Read, details string) {
+	limit_passed := f.ctx.read_last_block(mut read)
+	if !limit_passed && f.ctx.debug > 0 {
+		line := 'OTHER  block:${read.get_block_number():6} ${read.get_special()} ${details} ${read.get_path()} '
+		println(term.colorize(term.bright_yellow, line))
+	}
+}
+
+// dir_block handles a directory block.
+// It first applies the block limit, then prints the block when debug > 1.
+fn (mut f FileReader) dir_block(mut read tar.Read, size u64) {
+	limit_passed := f.ctx.read_last_block(mut read)
+	if !limit_passed && f.ctx.debug > 1 {
+		line := 'DIR    block:${read.get_block_number():6} ${read.get_path()} size:${size}'
+		println(term.colorize(term.green, line))
+	}
+}
+
+// file_block handles a file header block.
+// It first applies the block limit, prints the block when debug > 2, and
+// remembers the path of the first file that ends with the requested filename.
+fn (mut f FileReader) file_block(mut read tar.Read, size u64) {
+	if f.ctx.read_last_block(mut read) {
+		return
+	}
+	current := read.get_path()
+	if f.ctx.debug > 2 {
+		line := ' FILE  block:${read.get_block_number():6} ${current} size:${size}'
+		println(term.colorize(term.bright_blue, line))
+	}
+	wanted := f.ctx.filename
+	if wanted == '' || f.filepath != '' {
+		// nothing requested, or a file was already matched
+		return
+	}
+	if current.ends_with(wanted) {
+		f.filepath = current
+	}
+}
+
+// data_block handles a data block of the current file.
+// It first applies the block limit and prints the block when debug > 3.
+// When the block belongs to the matched file, its data is appended to
+// `f.content`, and the reading is stopped once no data is pending.
+fn (mut f FileReader) data_block(mut read tar.Read, data []u8, pending int) {
+	if f.ctx.read_last_block(mut read) {
+		return
+	}
+	current := read.get_path()
+	if f.ctx.debug > 3 {
+		println('  DATA block:${read.get_block_number():6} ${current} len:${data.len} pend:${pending}')
+	}
+	if f.ctx.filename == '' || f.filepath != current {
+		// no file requested, or this data is not part of the matched file
+		return
+	}
+	f.content << data
+	if pending == 0 {
+		// our file of interest data is complete
+		read.stop_early = true
+	}
+}
+
+// main parses the options, loads the archive into memory, decompresses and
+// untars it through a FileReader, then prints a summary and the collected content.
+fn main() {
+	ctx := new_context()!
+	reader := FileReader{
+		ctx: ctx
+	}
+	mut untar := tar.new_untar(reader)
+	mut decompressor := tar.new_decompresor(untar)
+	downloader := new_downloader(ctx.url)!
+	archive_bytes := downloader.data
+	if ctx.chunks {
+		decompressor.read_chunks(archive_bytes)!
+	} else {
+		decompressor.read_all(archive_bytes)!
+	}
+	separator := '-'.repeat(80)
+	println(separator)
+	println('Download: ${ctx.url} chunks:${downloader.chunks} bytes=${archive_bytes.len}')
+	println('Untar:    ${untar}')
+	println('Content:  Path:${reader.filepath} bytes:${reader.content.len}')
+	println(separator)
+	println(reader.content.bytestr())
+	println(separator)
+}
@@ -0,0 +1,3 @@
+## Description
+
+`archive` is a namespace for different archive formats like `tar` or `zip`.
@@ -0,0 +1,33 @@
+## Description
+
+`tar` is a module to access tar archives.
+
+Tape archives (tar) are a file format for storing a sequence of files that can be read and written
+as streams. This module covers the reading of the basic sections of archives produced by GNU tools
+like the Linux command `tar -xvf`, but in memory instead of modifying the filesystem. It parses
+directories, files, and file contents, and manages paths longer than 100 chars.
+
+### Read Efficiency
+
+An entire tar file can be read in memory or by chunks. The reader keeps in memory a single
+decompressed [chunk](https://modules.vlang.io/compress.gzip.html#decompress_with_callback) of
+32 KB at a time, and also a single tar block of 512 bytes at a time. Paths are converted to
+strings only when needed, and the user's reader implementation can stop the reading process early.
+
+### Read Example
+
+The tar blocks are parsed and some fields are passed to the methods of the `Reader` implementation.
+
+```v
+import os
+import archive.tar
+
+fn main() {
+	// Move to the module root so that the relative path below resolves;
+	// a failure of chdir is deliberately ignored.
+	os.chdir(@VMODROOT) or {}
+	path := 'archive/tar/testdata/life.tar.gz'
+	// NOTE(review): presumably a reader that prints every block it is given - confirm.
+	reader := tar.new_debug_reader()
+	tar.read_tar_gz_file(path, reader)!
+}
+```
+See also the `tar_gz_reader.v` program in the `examples` folder.
+
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+## Description`
	`2`	`+`
	`3`	+`archive` is a namespace for different archive formats like `tar` or `zip`.