diff --git a/cmd/hack/hack.go b/cmd/hack/hack.go index 8484094a2adbe3501e64c3ac38317e21054bdcc6..9130aabf262d649132da5964bad34b4c0b22fcd0 100644 --- a/cmd/hack/hack.go +++ b/cmd/hack/hack.go @@ -1785,7 +1785,7 @@ func compress1(chaindata string, name string) error { if err := reducedict(name); err != nil { return err } - if err := createIdx(*chainID, name, itemsCount); err != nil { + if err := _createIdx(*chainID, name, itemsCount); err != nil { return err } return nil @@ -2282,11 +2282,6 @@ func (hf *HuffmanCoder) flush() error { // reduceDict reduces the dictionary by trying the substitutions and counting frequency for each word func reducedict(name string) error { - go func() { - if err := http.ListenAndServe("localhost:6060", nil); err != nil { - log.Error("Failure in running pprof server", "err", err) - } - }() logEvery := time.NewTicker(20 * time.Second) defer logEvery.Stop() // Read up the dictionary @@ -2724,6 +2719,8 @@ func recsplitLookup(chaindata, name string) error { defer database.Close() chainConfig := tool.ChainConfigFromDB(database) chainID, _ := uint256.FromBig(chainConfig.ChainID) + logEvery := time.NewTicker(20 * time.Second) + defer logEvery.Stop() d, err := compress.NewDecompressor(name + ".compressed.dat") if err != nil { @@ -2752,20 +2749,56 @@ func recsplitLookup(chaindata, name string) error { wc++ t := time.Now() - offset := idx.Lookup(slot.IdHash[:]) + recID := idx.Lookup(slot.IdHash[:]) l1 += time.Since(t) - _ = idx.Lookup2(offset) + t = time.Now() + _ = idx.Lookup2(recID) l2 += time.Since(t) - if wc%10_000_000 == 0 { - log.Info("Checked", "millions", wc/1_000_000) + + select { + default: + case <-logEvery.C: + var m runtime.MemStats + runtime.ReadMemStats(&m) + log.Info("Checked", "millions", float64(wc)/1_000_000, + "lookup", time.Duration(int64(l1)/int64(wc)), "lookup2", time.Duration(int64(l2)/int64(wc)), + "alloc", common.StorageSize(m.Alloc), "sys", common.StorageSize(m.Sys), + ) } } + total = time.Since(start) log.Info("Average decoding time", "lookup", time.Duration(int64(l1)/int64(wc)), "lookup + lookup2", time.Duration(int64(l2)/int64(wc)), "items", wc, "total", total) return nil } -func createIdx(chainID uint256.Int, name string, count int) error { +func createIdx(chaindata string, name string) error { + database := mdbx.MustOpen(chaindata) + defer database.Close() + chainConfig := tool.ChainConfigFromDB(database) + chainID, _ := uint256.FromBig(chainConfig.ChainID) + d, err := compress.NewDecompressor(name + ".compressed.dat") + if err != nil { + return err + } + defer d.Close() + logEvery := time.NewTicker(20 * time.Second) + defer logEvery.Stop() + g := d.MakeGetter() + var word = make([]byte, 0, 4*1024) + wc := 0 + for g.HasNext() { + word, _ = g.Next(word[:0]) + wc++ + select { + default: + case <-logEvery.C: + log.Info("[Filling recsplit] Processed", "millions", wc/1_000_000) + } + } + return _createIdx(*chainID, name, wc) +} +func _createIdx(chainID uint256.Int, name string, count int) error { d, err := compress.NewDecompressor(name + ".compressed.dat") if err != nil { return err @@ -2812,7 +2845,7 @@ RETRY: select { default: case <-logEvery.C: - log.Info("[Creating index] Processed", "millions", wc/1_000_000) + log.Info("[Filling recsplit] Processed", "millions", wc/1_000_000) } } log.Info("Building recsplit...") @@ -2822,6 +2855,7 @@ RETRY: } if rs.Collision() { + log.Info("Building recsplit. Collision happened. It's ok. Restarting...") rs.ResetNextSalt() goto RETRY } @@ -4028,6 +4062,11 @@ func main() { } defer pprof.StopCPUProfile() } + go func() { + if err := http.ListenAndServe("localhost:6060", nil); err != nil { + log.Error("Failure in running pprof server", "err", err) + } + }() var err error switch *action { @@ -4174,6 +4213,8 @@ func main() { err = dumpState(*chaindata, int(*block), *name) case "compress": err = compress1(*chaindata, *name) + case "createIdx": + err = createIdx(*chaindata, *name) case "recsplitLookup": err = recsplitLookup(*chaindata, *name) case "decompress": diff --git a/go.mod b/go.mod index 4ec2df1fbfee8d39064f00d44c1586866b67c345..7be390240c81b2522a01df31fa320007e6368ded 100644 --- a/go.mod +++ b/go.mod @@ -36,7 +36,7 @@ require ( github.com/json-iterator/go v1.1.12 github.com/julienschmidt/httprouter v1.3.0 github.com/kevinburke/go-bindata v3.21.0+incompatible - github.com/ledgerwatch/erigon-lib v0.0.0-20211031023235-7582da6c7866 + github.com/ledgerwatch/erigon-lib v0.0.0-20211101021507-683d16a7a16e github.com/ledgerwatch/log/v3 v3.4.0 github.com/ledgerwatch/secp256k1 v0.0.0-20210626115225-cd5cd00ed72d github.com/logrusorgru/aurora/v3 v3.0.0 diff --git a/go.sum b/go.sum index 9dc4310472ed6283a71d81c3da607e0f8d8fbfd0..b5ef48e641512b09635fc74e0e2b1ef1d9b55105 100644 --- a/go.sum +++ b/go.sum @@ -497,8 +497,8 @@ github.com/kylelemons/godebug v0.0.0-20170224010052-a616ab194758 h1:0D5M2HQSGD3P github.com/kylelemons/godebug v0.0.0-20170224010052-a616ab194758/go.mod h1:B69LEHPfb2qLo0BaaOLcbitczOKLWTsrBG9LczfCD4k= github.com/leanovate/gopter v0.2.9 h1:fQjYxZaynp97ozCzfOyOuAGOU4aU/z37zf/tOujFk7c= github.com/leanovate/gopter v0.2.9/go.mod h1:U2L/78B+KVFIx2VmW6onHJQzXtFb+p5y3y2Sh+Jxxv8= -github.com/ledgerwatch/erigon-lib v0.0.0-20211031023235-7582da6c7866 h1:CNyOjjYS1FElLzHT2HTHtP4swZqaihlkrNmK7yRr2Ok= -github.com/ledgerwatch/erigon-lib v0.0.0-20211031023235-7582da6c7866/go.mod h1:tmLML7kM8BV92RBOUJ4FXmLY/gSqZ8AHW4kkoDQud8k= +github.com/ledgerwatch/erigon-lib v0.0.0-20211101021507-683d16a7a16e h1:NSsCApQHWHMVOWcxLwRCMytPsKZOFOoFhgzw/q6cIro= +github.com/ledgerwatch/erigon-lib v0.0.0-20211101021507-683d16a7a16e/go.mod h1:tmLML7kM8BV92RBOUJ4FXmLY/gSqZ8AHW4kkoDQud8k= github.com/ledgerwatch/log/v3 v3.4.0 h1:SEIOcv5a2zkG3PmoT5jeTU9m/0nEUv0BJS5bzsjwKCI= github.com/ledgerwatch/log/v3 v3.4.0/go.mod h1:VXcz6Ssn6XEeU92dCMc39/g1F0OYAjw1Mt+dGP5DjXY= github.com/ledgerwatch/secp256k1 v0.0.0-20210626115225-cd5cd00ed72d h1:/IKMrJdfRsoYNc36PXqP4xMH3vhW/8IQyBKGQbKZUno=