From 738da1a2f97588d454b5fb02a17e343ce0af29a7 Mon Sep 17 00:00:00 2001 From: ktock Date: Mon, 1 Jun 2020 13:30:59 +0900 Subject: [PATCH] Prevent the prefetch from making big HTTP request header During prefetch, current filesystem implementation chunks this prefetching range into small, many, and mostly neighbouring chunks and lists them in a single HTTP Range Request header without enough squashing. Sometimes this leads to large HTTP header and the request fails. This commit solves this by aggressively squashing neighbouring/overwrapping chunks in HTTP headers, as much as possible. Signed-off-by: Kohei Tokunaga --- stargz/remote/util.go | 57 ++++++++++++++++++++++++++++---------- stargz/remote/util_test.go | 14 +++++++++- 2 files changed, 55 insertions(+), 16 deletions(-) diff --git a/stargz/remote/util.go b/stargz/remote/util.go index 3a7c7e1a0..1fd3899bf 100644 --- a/stargz/remote/util.go +++ b/stargz/remote/util.go @@ -46,31 +46,58 @@ func superRegion(regs []region) region { // regionSet is a set of regions type regionSet struct { - rs []region + rs []region // must be kept sorted } -// add attempts to merge r to rs.rs +// add attempts to merge r to rs.rs with squashing the regions as +// small as possible. This operation takes O(n). +// TODO: more efficient way to do it. func (rs *regionSet) add(r region) { - for i := range rs.rs { - f := &rs.rs[i] - if r.b <= f.b && f.b <= r.e+1 && r.e <= f.e { - f.b = r.b + // Iterate over the sorted region slice from the tail. + // a) When an overwrap occurs, adjust `r` to fully contain the looking region + // `l` and remove `l` from region slice. + // b) Once l.e become less than r.b, no overwrap will occur again. So immediately + // insert `r` which fully contains all overwrapped regions, to the region slice. + // Here, `r` is inserted to the region slice with keeping it sorted, without + // overwrapping to any regions. + // *) If any `l` contains `r`, we don't need to do anything so return immediately. + for i := len(rs.rs) - 1; i >= 0; i-- { + l := &rs.rs[i] + + // *) l contains r + if l.b <= r.b && r.e <= l.e { return } - if f.b <= r.b && r.e <= f.e { - return + + // a) r overwraps to l so adjust r to fully contain l and reomve l + // from region slice. + if l.b <= r.b && r.b <= l.e+1 && l.e <= r.e { + r.b = l.b + rs.rs = append(rs.rs[:i], rs.rs[i+1:]...) + continue } - if f.b <= r.b && r.b <= f.e+1 && f.e <= r.e { - f.e = r.e - return + if r.b <= l.b && l.b <= r.e+1 && r.e <= l.e { + r.e = l.e + rs.rs = append(rs.rs[:i], rs.rs[i+1:]...) + continue } - if r.b <= f.b && f.e <= r.e { - f.b = r.b - f.e = r.e + if r.b <= l.b && l.e <= r.e { + rs.rs = append(rs.rs[:i], rs.rs[i+1:]...) + continue + } + + // b) No overwrap will occur after this iteration. Instert r to the + // region slice immediately. + if l.e < r.b { + rs.rs = append(rs.rs[:i+1], append([]region{r}, rs.rs[i+1:]...)...) return } + + // No overwrap occurs yet. See the next region. } - rs.rs = append(rs.rs, r) + + // r is the topmost region among regions in the slice. + rs.rs = append([]region{r}, rs.rs...) } func (rs *regionSet) totalSize() int64 { diff --git a/stargz/remote/util_test.go b/stargz/remote/util_test.go index 8058971c6..827c53438 100644 --- a/stargz/remote/util_test.go +++ b/stargz/remote/util_test.go @@ -46,7 +46,7 @@ func TestRegionSet(t *testing.T) { }, { input: []region{{2, 4}, {6, 8}, {1, 5}}, - expected: []region{{1, 5}, {6, 8}}, + expected: []region{{1, 8}}, }, { input: []region{{1, 2}, {1, 2}}, @@ -72,6 +72,18 @@ func TestRegionSet(t *testing.T) { input: []region{{4, 6}, {1, 3}}, // region.e is inclusive expected: []region{{1, 6}}, }, + { + input: []region{{4, 6}, {1, 3}, {7, 9}, {2, 8}}, + expected: []region{{1, 9}}, + }, + { + input: []region{{4, 6}, {1, 5}, {7, 9}, {4, 8}}, + expected: []region{{1, 9}}, + }, + { + input: []region{{7, 8}, {1, 2}, {5, 6}}, + expected: []region{{1, 2}, {5, 8}}, + }, } for i, tt := range tests { var rs regionSet