更新

唐旭辉
go.mod
main.go
pkg/application/factory/dao.go
pkg/application/syncOrder/command/sync_bestshop.go
pkg/application/syncOrder/service/sync_order.go
pkg/infrastructure/dao/pg_order_bestshop.go
pkg/port/consumer/configs/config.go
pkg/port/consumer/consumer.go
pkg/port/consumer/topic_handle_router.go
pkg/port/consumer/topic_handles.go
vendor/github.com/DataDog/zstd/.travis.yml
vendor/github.com/DataDog/zstd/LICENSE
vendor/github.com/DataDog/zstd/README.md
vendor/github.com/DataDog/zstd/ZSTD_LICENSE
vendor/github.com/DataDog/zstd/bitstream.h
vendor/github.com/DataDog/zstd/compiler.h
vendor/github.com/DataDog/zstd/cover.c
vendor/github.com/DataDog/zstd/cover.h
vendor/github.com/DataDog/zstd/cpu.h
vendor/github.com/DataDog/zstd/debug.c
--- a/go.mod
查看文件 @4f5343b
+++ b/go.mod
查看文件 @4f5343b
@@ -4,6 +4,7 @@ go 1.14
 
 require (
 	github.com/GeeTeam/gt3-golang-sdk v0.0.0-20200116043922-446ca8a507d2
+ 	github.com/Shopify/sarama v1.23.1
 	github.com/ajg/form v1.5.1 // indirect
 	github.com/astaxie/beego v1.12.2
 	github.com/dgrijalva/jwt-go v3.2.0+incompatible
--- a/main.go
查看文件 @4f5343b
+++ b/main.go
查看文件 @4f5343b
 package main
 
 import (
+ 	"context"
+ 	"fmt"
+ 	"os"
+ 	"os/signal"
+ 	"syscall"
+ 
 	"github.com/astaxie/beego"
 	"github.com/astaxie/beego/logs"
 	_ "gitlab.fjmaimaimai.com/mmm-go/partnermg/pkg/infrastructure/pg"
 	_ "gitlab.fjmaimaimai.com/mmm-go/partnermg/pkg/log"
 	_ "gitlab.fjmaimaimai.com/mmm-go/partnermg/pkg/port/beego"
+ 	"gitlab.fjmaimaimai.com/mmm-go/partnermg/pkg/port/consumer"
 )
 
 func main() {
+ 	// Start the Kafka consumer, then serve HTTP until the process is asked to stop.
+ 	// SIGKILL cannot be trapped, so only SIGINT (os.Interrupt) and SIGTERM are registered.
+ 	sigs := make(chan os.Signal, 1)
+ 	signal.Notify(sigs, os.Interrupt, syscall.SIGTERM)
+ 	ctx, cancel := context.WithCancel(context.Background())
+ 	closeConsumer, err := consumer.StartConsumer(ctx)
+ 	if err != nil {
+ 		cancel() // release the context; nothing will ever use it
+ 		fmt.Printf("启动kafka消息消费者失败 err%s \n", err)
+ 		logs.Error("启动kafka消息消费者失败:%s", err)
+ 		return
+ 	}
+ 	go func() {
+ 		<-sigs
+ 		// Cancel first so the consume loop ends, then close the consumer group.
+ 		cancel()
+ 		closeConsumer()
+ 		// Trapping the signals disables their default "terminate" action and
+ 		// beego.Run() keeps blocking, so the process has to exit explicitly.
+ 		// NOTE(review): if beego graceful shutdown is enabled it installs its own
+ 		// handler; confirm the two do not race.
+ 		os.Exit(0)
+ 	}()
+ 
 	logs.Info("应用启动")
 	beego.Run()
 }
--- a/pkg/application/factory/dao.go
查看文件 @4f5343b
+++ b/pkg/application/factory/dao.go
查看文件 @4f5343b
@@ -21,6 +21,14 @@ func CreateOrderBaseDao(options map[string]interface{}) (*dao.OrderBaseDao, erro
 	return dao.NewOrderBaseDao(transactionContext)
 }
 
+ // CreateOrderBestshopDao builds an OrderBestshopDao from the transaction
+ // context stored under options["transactionContext"]. When the key is absent
+ // a nil context is handed to dao.NewOrderBestshopDao.
+ func CreateOrderBestshopDao(options map[string]interface{}) (*dao.OrderBestshopDao, error) {
+ 	var txCtx *transaction.TransactionContext
+ 	raw, found := options["transactionContext"]
+ 	if found {
+ 		// Unchecked assertion: a value of any other type panics here.
+ 		txCtx = raw.(*transaction.TransactionContext)
+ 	}
+ 	return dao.NewOrderBestshopDao(txCtx)
+ }
+ 
 func CreateUsersDao(options map[string]interface{}) (*dao.UsersDao, error) {
 	var transactionContext *transaction.TransactionContext
 	if value, ok := options["transactionContext"]; ok {
--- a/pkg/application/syncOrder/command/sync_bestshop.go
查看文件 @4f5343b
+++ b/pkg/application/syncOrder/command/sync_bestshop.go
查看文件 @4f5343b
@@ -8,6 +8,8 @@ type CreateOrderFromBestshop struct {
 	OrderCode string `json:"orderCode"`
 	//下单时间
 	OrderTime string `json:"orderTime"`
+ 	//公司id
+ 	CompanyId int64 `json:"companyId"`
 	//订单状态
 	OrderState int8 `json:"orderState"`
 	//发货状态
--- a/pkg/application/syncOrder/service/sync_order.go
查看文件 @4f5343b
+++ b/pkg/application/syncOrder/service/sync_order.go
查看文件 @4f5343b
@@ -4,6 +4,8 @@ import (
 	"fmt"
 	"time"
 
+ 	"gitlab.fjmaimaimai.com/mmm-go/partnermg/pkg/infrastructure/dao"
+ 
 	"github.com/astaxie/beego/logs"
 
 	"gitlab.fjmaimaimai.com/mmm-go/partnermg/pkg/application/factory"
@@ -37,6 +39,25 @@ func (s SyncOrderService) SyncOrderFromBestshop(cmd command.CreateOrderFromBests
 	defer func() {
 		transactionContext.RollbackTransaction()
 	}()
+ 
+ 	// Check whether this order has already been stored (looked up by order code).
+ 	var (
+ 		orderBestshopDao *dao.OrderBestshopDao
+ 	)
+ 	if orderBestshopDao, err = factory.CreateOrderBestshopDao(map[string]interface{}{
+ 		"transactionContext": transactionContext,
+ 	}); err != nil {
+ 		return lib.ThrowError(lib.TRANSACTION_ERROR, err.Error())
+ 	}
+ 	ok, err := orderBestshopDao.OrderExist(cmd.OrderCode)
+ 	if err != nil {
+ 		return lib.ThrowError(lib.TRANSACTION_ERROR, err.Error())
+ 	}
+ 	if ok {
+ 		logs.Info("订单已存在，order_code=%s", cmd.OrderCode)
+ 		return nil
+ 	}
+ 
 	var (
 		orderBestshopRepository     domain.OrderBestshopRepository
 		orderGoodBestshopRepository domain.OrderGoodBestshopRepository
@@ -173,11 +194,25 @@ func (s SyncOrderService) copyOrderBestshopToOrderBase(orderBestshop *domain.Ord
 		ordergoods []domain.OrderGood
 	)
 	//TODO 添加orderBase
+ 	orderBestshop.CopyToOrderBase(&orderbase)
+ 	orderbase.CompanyId = companyData.Id
+ 	for i := range orderBestshop.Goods {
+ 		good := domain.NewOrderGood()
+ 		orderBestshop.Goods[i].CopyToOrderGood(&good)
+ 		good.OrderId = orderbase.Id
+ 		good.Compute()
+ 		ordergoods = append(ordergoods, good)
+ 	}
+ 	orderbase.Goods = ordergoods
+ 	orderbase.Compute()
 	err = orderBaseRepository.Save(&orderbase)
 	if err != nil {
 		e := fmt.Sprintf("添加order_base数据失败%s", err)
 		return lib.ThrowError(lib.INTERNAL_SERVER_ERROR, e)
 	}
+ 	for i := range ordergoods {
+ 		ordergoods[i].OrderId = orderbase.Id
+ 	}
 	//TODO 添加goods
 	err = orderGoodRepository.Save(ordergoods)
 	if err != nil {
@@ -185,6 +220,7 @@ func (s SyncOrderService) copyOrderBestshopToOrderBase(orderBestshop *domain.Ord
 		return lib.ThrowError(lib.INTERNAL_SERVER_ERROR, e)
 	}
 	//TODO 更新isCopy
+ 	orderBestshop.IsCopy = true
 	err = orderBestshopRepository.Edit(orderBestshop)
 	if err != nil {
 		return lib.ThrowError(lib.INTERNAL_SERVER_ERROR, err.Error())
--- a/pkg/infrastructure/dao/pg_order_bestshop.go 0 → 100644
查看文件 @4f5343b
+++ b/pkg/infrastructure/dao/pg_order_bestshop.go 0 → 100644
查看文件 @4f5343b
+ package dao
+ 
+ import (
+ 	"fmt"
+ 
+ 	"gitlab.fjmaimaimai.com/mmm-go/partnermg/pkg/infrastructure/pg/models"
+ 	"gitlab.fjmaimaimai.com/mmm-go/partnermg/pkg/infrastructure/pg/transaction"
+ )
+ 
+ // OrderBestshopDao runs queries against models.OrderBestshop through a
+ // transaction context.
+ type OrderBestshopDao struct {
+ 	// transactionContext supplies the DB handle used by the DAO's queries.
+ 	transactionContext *transaction.TransactionContext
+ }
+ 
+ // NewOrderBestshopDao wraps transactionContext in an OrderBestshopDao.
+ // A nil transactionContext is rejected with an error.
+ func NewOrderBestshopDao(transactionContext *transaction.TransactionContext) (*OrderBestshopDao, error) {
+ 	if transactionContext != nil {
+ 		created := &OrderBestshopDao{transactionContext: transactionContext}
+ 		return created, nil
+ 	}
+ 	return nil, fmt.Errorf("transactionContext参数不能为nil")
+ }
+ 
+ // OrderExist reports whether a models.OrderBestshop row with the given order
+ // code exists. The query runs on the DB handle of the DAO's transaction context.
+ func (d OrderBestshopDao) OrderExist(orderCode string) (bool, error) {
+ 	tx := d.transactionContext.GetDB()
+ 	// The model must be passed by pointer: go-pg rejects a non-pointer struct
+ 	// model and the query would fail before reaching the database.
+ 	// NOTE(review): assumes GetDB returns a go-pg handle — confirm.
+ 	m := new(models.OrderBestshop)
+ 	return tx.Model(m).Where("order_code=?", orderCode).Exists()
+ }
--- a/pkg/port/consumer/configs/config.go 0 → 100644
查看文件 @4f5343b
+++ b/pkg/port/consumer/configs/config.go 0 → 100644
查看文件 @4f5343b
+ package configs
+ 
+ // MqConfig holds the connection settings of the message-queue consumer.
+ type MqConfig struct {
+ 	// Servers lists the broker addresses in host:port form.
+ 	Servers    []string `json:"servers"`
+ 	// ConsumerId is serialized under the JSON key "consumerGroup".
+ 	ConsumerId string   `json:"consumerGroup"`
+ }
+ 
+ // Cfg is the package-wide consumer configuration; init fills it in.
+ var Cfg MqConfig
+ 
+ // init populates Cfg with the hard-coded broker address and group id.
+ func init() {
+ 	Cfg.Servers = []string{"192.168.190.136:9092"}
+ 	Cfg.ConsumerId = "partnermg"
+ }
+ 
+ // "",
+ // "106.52.15.41:9092"
--- a/pkg/port/consumer/consumer.go 0 → 100644
查看文件 @4f5343b
+++ b/pkg/port/consumer/consumer.go 0 → 100644
查看文件 @4f5343b
+ package consumer
+ 
+ import (
+ 	"context"
+ 	"errors"
+ 	"sync"
+ 
+ 	"gitlab.fjmaimaimai.com/mmm-go/partnermg/pkg/port/consumer/configs"
+ 
+ 	"github.com/Shopify/sarama"
+ 	"github.com/astaxie/beego/logs"
+ )
+ 
+ // MessageConsumer is the Kafka consumer-group handler. It hands every
+ // consumed message to the TopicHandle registered for the message's topic.
+ type MessageConsumer struct {
+ 	// ready is closed by Setup; StartConsumer blocks on it before returning.
+ 	ready         chan bool
+ 	// kafkaHosts and groupId are taken from configs.Cfg by NewMessageConsumer.
+ 	kafkaHosts    []string
+ 	groupId       string
+ 	// topics holds the keys of topicsHandles, i.e. the topics to subscribe to.
+ 	topics        []string
+ 	// topicsHandles maps a topic name to its handler.
+ 	topicsHandles map[string]TopicHandle
+ }
+ 
+ // NewMessageConsumer builds a consumer that subscribes to every topic with an
+ // entry in TopicHandleRouters, using the broker list and group id from configs.Cfg.
+ func NewMessageConsumer() *MessageConsumer {
+ 	subscribed := make([]string, 0, len(TopicHandleRouters))
+ 	for name := range TopicHandleRouters {
+ 		subscribed = append(subscribed, name)
+ 	}
+ 	mc := new(MessageConsumer)
+ 	mc.ready = make(chan bool)
+ 	mc.kafkaHosts = configs.Cfg.Servers
+ 	mc.groupId = configs.Cfg.ConsumerId
+ 	mc.topicsHandles = TopicHandleRouters
+ 	mc.topics = subscribed
+ 	return mc
+ }
+ 
+ //实现对应的接口
+ var _ sarama.ConsumerGroupHandler = (*MessageConsumer)(nil)
+ 
+ // Setup runs at the start of every consumer-group session and signals
+ // readiness by closing c.ready. The close is guarded because the consume loop
+ // re-enters Consume after each rebalance, so Setup runs again; an
+ // unconditional close would then panic on the already-closed channel.
+ func (c *MessageConsumer) Setup(groupSession sarama.ConsumerGroupSession) error {
+ 	select {
+ 	case <-c.ready:
+ 		// Nothing ever sends on ready, so a successful receive means it was
+ 		// already closed by an earlier session.
+ 	default:
+ 		close(c.ready)
+ 	}
+ 	return nil
+ }
+ 
+ // Cleanup is the session-end hook of sarama.ConsumerGroupHandler. This
+ // implementation has nothing to release and always returns nil.
+ func (c *MessageConsumer) Cleanup(groupSession sarama.ConsumerGroupSession) error {
+ 	return nil
+ }
+ 
+ func (c *MessageConsumer) ConsumeClaim(groupSession sarama.ConsumerGroupSession,
+ 	groupClaim sarama.ConsumerGroupClaim) error {
+ 	var (
+ 		topicHandle TopicHandle
+ 		err         error
+ 	)
+ 	for message := range groupClaim.Messages() {
+ 		if topicHandle, err = c.FindTopichandle(groupClaim.Topic()); err != nil {
+ 			logs.Error("FindTopichandle err:%s \n", err)
+ 			continue
+ 		}
+ 		if err = topicHandle(message); err != nil {
+ 			logs.Error("Message claimed: kafka消息处理错误 topic =", message.Topic, message.Offset, err)
+ 		}
+ 		groupSession.MarkMessage(message, "")
+ 	}
+ 	return nil
+ }
+ 
+ // FindTopichandle returns the handler registered for topic, or an error when
+ // the topic has no entry in the consumer's handler table.
+ func (c *MessageConsumer) FindTopichandle(topic string) (TopicHandle, error) {
+ 	handle, registered := c.topicsHandles[topic]
+ 	if !registered {
+ 		return nil, errors.New("TopicHandle not found")
+ 	}
+ 	return handle, nil
+ }
+ 
+ // StartConsumer creates the Kafka consumer group and starts consuming in a
+ // background goroutine. It blocks until the first session has been set up, or
+ // until ctx is cancelled, in which case the group is closed and ctx.Err() is
+ // returned.
+ //
+ // On success it returns a close function. That function waits for the consume
+ // loop to finish before closing the group, so the caller must cancel ctx
+ // before calling it.
+ func StartConsumer(ctx context.Context) (func(), error) {
+ 	consumer := NewMessageConsumer()
+ 	config := sarama.NewConfig()
+ 	config.Consumer.Group.Rebalance.Strategy = sarama.BalanceStrategyRoundRobin
+ 	config.Consumer.Offsets.Initial = sarama.OffsetNewest
+ 	config.Version = sarama.V0_11_0_2
+ 	consumerGroup, err := sarama.NewConsumerGroup(consumer.kafkaHosts, consumer.groupId, config)
+ 	if err != nil {
+ 		return nil, err
+ 	}
+ 	wg := &sync.WaitGroup{}
+ 	wg.Add(1)
+ 	go func() {
+ 		defer wg.Done()
+ 		for {
+ 			// Consume returns whenever a session ends, so it is re-entered
+ 			// until ctx is cancelled.
+ 			// NOTE(review): a persistently failing Consume retries with no backoff.
+ 			if err := ctx.Err(); err != nil {
+ 				logs.Error("ctx err:%s \n", err)
+ 				return
+ 			}
+ 			if err := consumerGroup.Consume(ctx, consumer.topics, consumer); err != nil {
+ 				logs.Error("consumerGroup err:%s \n", err)
+ 			}
+ 		}
+ 	}()
+ 	closeGroup := func() {
+ 		wg.Wait()
+ 		if err := consumerGroup.Close(); err != nil {
+ 			logs.Error("consumerGroup.Close err %s", err)
+ 		}
+ 		logs.Info("consumerGroup.Close")
+ 	}
+ 	// Wait for the first session to be set up, but do not hang forever when
+ 	// ctx is cancelled before that happens.
+ 	select {
+ 	case <-consumer.ready:
+ 	case <-ctx.Done():
+ 		closeGroup()
+ 		return nil, ctx.Err()
+ 	}
+ 	// Successful start-up is informational, not an error.
+ 	logs.Info("Sarama consumer up and running!...")
+ 	return closeGroup, nil
+ }
--- a/pkg/port/consumer/topic_handle_router.go 0 → 100644
查看文件 @4f5343b
+++ b/pkg/port/consumer/topic_handle_router.go 0 → 100644
查看文件 @4f5343b
+ package consumer
+ 
+ import (
+ 	"fmt"
+ 
+ 	"github.com/Shopify/sarama"
+ )
+ 
+ // TopicHandle processes a single message consumed from Kafka.
+ type TopicHandle func(*sarama.ConsumerMessage) error
+ 
+ // TopicHandleRouters maps a topic name to the handler for that topic's messages.
+ var TopicHandleRouters = map[string]TopicHandle{
+ 	// "topic_test" only prints the message and reports success.
+ 	"topic_test": func(message *sarama.ConsumerMessage) error {
+ 		fmt.Printf("Done Message claimed:  timestamp = %v, topic = %s offset = %v value = %v \n",
+ 			message.Timestamp, message.Topic, message.Offset, string(message.Value))
+ 		return nil
+ 	},
+ 	"bestshop_order": SyncBestshopOrder,
+ }
--- a/pkg/port/consumer/topic_handles.go 0 → 100644
查看文件 @4f5343b
+++ b/pkg/port/consumer/topic_handles.go 0 → 100644
查看文件 @4f5343b
+ package consumer
+ 
+ import (
+ 	"encoding/json"
+ 	"fmt"
+ 
+ 	"github.com/Shopify/sarama"
+ 	"github.com/astaxie/beego/logs"
+ 	syncOrderCmd "gitlab.fjmaimaimai.com/mmm-go/partnermg/pkg/application/syncOrder/command"
+ 	syncOrderSrv "gitlab.fjmaimaimai.com/mmm-go/partnermg/pkg/application/syncOrder/service"
+ )
+ 
+ // SyncBestshopOrder decodes the message value as JSON into a
+ // CreateOrderFromBestshop command and passes it to the sync-order service.
+ // Messages whose PartnerId is not positive are logged and dropped with a nil
+ // error. A decode failure is returned wrapped, so the cause stays reachable
+ // through errors.Is / errors.As.
+ func SyncBestshopOrder(message *sarama.ConsumerMessage) error {
+ 	logs.Info("Done Message claimed:  timestamp = %v, topic = %s offset = %v value = %v \n",
+ 		message.Timestamp, message.Topic, message.Offset, string(message.Value))
+ 	var cmd syncOrderCmd.CreateOrderFromBestshop
+ 	if err := json.Unmarshal(message.Value, &cmd); err != nil {
+ 		// %w renders the same text as %s but keeps the decode error in the chain.
+ 		return fmt.Errorf("[SyncBestshopOrder] 解析kafka数据失败；%w", err)
+ 	}
+ 	if cmd.PartnerId <= 0 {
+ 		logs.Info("[SyncBestshopOrder] PartnerId<=0 ,不处理消息")
+ 		return nil
+ 	}
+ 	srv := syncOrderSrv.NewOrderInfoService(nil)
+ 	return srv.SyncOrderFromBestshop(cmd)
+ }
--- a/vendor/github.com/DataDog/zstd/.travis.yml 0 → 100644
查看文件 @4f5343b
+++ b/vendor/github.com/DataDog/zstd/.travis.yml 0 → 100644
查看文件 @4f5343b
+ dist: xenial
+ language: go
+ 
+ go:
+   - 1.10.x
+   - 1.11.x
+   - 1.12.x
+ 
+ os:
+   - linux
+   - osx
+ 
+ matrix:
+   include:
+     name: "Go 1.11.x CentOS 32bits"
+     language: go
+     go: 1.11.x
+     os: linux
+     services:
+       - docker
+     script:
+       # Please update Go version in travis_test_32 as needed
+       - "docker run -i -v \"${PWD}:/zstd\" toopher/centos-i386:centos6 /bin/bash -c \"linux32 --32bit i386 /zstd/travis_test_32.sh\""
+ 
+ install:
+   - "wget https://github.com/DataDog/zstd/files/2246767/mr.zip"
+   - "unzip mr.zip"
+ script:
+   - "go build"
+   - "PAYLOAD=`pwd`/mr go test -v"
+   - "PAYLOAD=`pwd`/mr go test -bench ."
--- a/vendor/github.com/DataDog/zstd/LICENSE 0 → 100644
查看文件 @4f5343b
+++ b/vendor/github.com/DataDog/zstd/LICENSE 0 → 100644
查看文件 @4f5343b
+ Simplified BSD License
+ 
+ Copyright (c) 2016, Datadog <info@datadoghq.com>
+ All rights reserved.
+ 
+ Redistribution and use in source and binary forms, with or without
+ modification, are permitted provided that the following conditions are met:
+ 
+     * Redistributions of source code must retain the above copyright notice,
+       this list of conditions and the following disclaimer.
+     * Redistributions in binary form must reproduce the above copyright notice,
+       this list of conditions and the following disclaimer in the documentation
+       and/or other materials provided with the distribution.
+     * Neither the name of the copyright holder nor the names of its contributors
+       may be used to endorse or promote products derived from this software
+       without specific prior written permission.
+ 
+ THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+ AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+ DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE
+ FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
+ SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
+ CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+ OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
--- a/vendor/github.com/DataDog/zstd/README.md 0 → 100644
查看文件 @4f5343b
+++ b/vendor/github.com/DataDog/zstd/README.md 0 → 100644
查看文件 @4f5343b
+ # Zstd Go Wrapper
+ 
+ [C Zstd Homepage](https://github.com/Cyan4973/zstd)
+ 
+ The current headers and C files are from *v1.3.8* (Commit
+ [470344d](https://github.com/facebook/zstd/releases/tag/v1.3.8)).
+ 
+ ## Usage
+ 
+ There are two main APIs:
+ 
+ * simple Compress/Decompress
+ * streaming API (io.Reader/io.Writer)
+ 
+ The compress/decompress APIs mirror that of lz4, while the streaming API was
+ designed to be a drop-in replacement for zlib.
+ 
+ ### Simple `Compress/Decompress`
+ 
+ 
+ ```go
+ // Compress compresses the byte array given in src and writes it to dst.
+ // If you already have a buffer allocated, you can pass it to prevent allocation
+ // If not, you can pass nil as dst.
+ // If the buffer is too small, it will be reallocated, resized, and returned by the function
+ // If dst is nil, this will allocate the worst case size (CompressBound(src))
+ Compress(dst, src []byte) ([]byte, error)
+ ```
+ 
+ ```go
+ // CompressLevel is the same as Compress but you can pass another compression level
+ CompressLevel(dst, src []byte, level int) ([]byte, error)
+ ```
+ 
+ ```go
+ // Decompress will decompress your payload into dst.
+ // If you already have a buffer allocated, you can pass it to prevent allocation
+ // If not, you can pass nil as dst (allocates a 4*src size as default).
+ // If the buffer is too small, it will retry 3 times by doubling the dst size
+ // After max retries, it will switch to the slower stream API to be sure to be able
+ // to decompress. Currently switches if compression ratio > 4*2**3=32.
+ Decompress(dst, src []byte) ([]byte, error)
+ ```
+ 
+ ### Stream API
+ 
+ ```go
+ // NewWriter creates a new object that can optionally be initialized with
+ // a precomputed dictionary. If dict is nil, compress without a dictionary.
+ // The dictionary array should not be changed during the use of this object.
+ // You MUST CALL Close() to write the last bytes of a zstd stream and free C objects.
+ NewWriter(w io.Writer) *Writer
+ NewWriterLevel(w io.Writer, level int) *Writer
+ NewWriterLevelDict(w io.Writer, level int, dict []byte) *Writer
+ 
+ // Write compresses the input data and write it to the underlying writer
+ (w *Writer) Write(p []byte) (int, error)
+ 
+ // Close flushes the buffer and frees C zstd objects
+ (w *Writer) Close() error
+ ```
+ 
+ ```go
+ // NewReader returns a new io.ReadCloser that will decompress data from the
+ // underlying reader.  If a dictionary is provided to NewReaderDict, it must
+ // not be modified until Close is called.  It is the caller's responsibility
+ // to call Close, which frees up C objects.
+ NewReader(r io.Reader) io.ReadCloser
+ NewReaderDict(r io.Reader, dict []byte) io.ReadCloser
+ ```
+ 
+ ### Benchmarks (benchmarked with v0.5.0)
+ 
+ The author of Zstd also wrote lz4. Zstd is intended to occupy a speed/ratio
+ level similar to what zlib currently provides.  In our tests, it can always
+ be made to be better than zlib by choosing an appropriate level while still
+ keeping compression and decompression time faster than zlib.
+ 
+ You can run the benchmarks against your own payloads by using the Go benchmarks tool.
+ Just export your payload filepath as the `PAYLOAD` environment variable and run the benchmarks:
+ 
+ ```go
+ go test -bench .
+ ```
+ 
+ Compression of a 7Mb pdf zstd (this wrapper) vs [czlib](https://github.com/DataDog/czlib):
+ ```
+ BenchmarkCompression               5     221056624 ns/op      67.34 MB/s
+ BenchmarkDecompression           100      18370416 ns/op     810.32 MB/s
+ 
+ BenchmarkFzlibCompress             2     610156603 ns/op      24.40 MB/s
+ BenchmarkFzlibDecompress          20      81195246 ns/op     183.33 MB/s
+ ```
+ 
+ Ratio is also better by a margin of ~20%.
+ Compression speed is always better than zlib on all the payloads we tested;
+ However, [czlib](https://github.com/DataDog/czlib) has optimisations that make it
+ faster at decompressing small payloads:
+ 
+ ```
+ Testing with size: 11... czlib: 8.97 MB/s, zstd: 3.26 MB/s
+ Testing with size: 27... czlib: 23.3 MB/s, zstd: 8.22 MB/s
+ Testing with size: 62... czlib: 31.6 MB/s, zstd: 19.49 MB/s
+ Testing with size: 141... czlib: 74.54 MB/s, zstd: 42.55 MB/s
+ Testing with size: 323... czlib: 155.14 MB/s, zstd: 99.39 MB/s
+ Testing with size: 739... czlib: 235.9 MB/s, zstd: 216.45 MB/s
+ Testing with size: 1689... czlib: 116.45 MB/s, zstd: 345.64 MB/s
+ Testing with size: 3858... czlib: 176.39 MB/s, zstd: 617.56 MB/s
+ Testing with size: 8811... czlib: 254.11 MB/s, zstd: 824.34 MB/s
+ Testing with size: 20121... czlib: 197.43 MB/s, zstd: 1339.11 MB/s
+ Testing with size: 45951... czlib: 201.62 MB/s, zstd: 1951.57 MB/s
+ ```
+ 
+ zstd starts to shine with payloads > 1KB
+ 
+ ### Stability - Current state: STABLE
+ 
+ The C library seems to be pretty stable and according to the author has been tested and fuzzed.
+ 
+ For the Go wrapper, the tests cover most usual cases and we have successfully tested it on all staging and prod data.
--- a/vendor/github.com/DataDog/zstd/ZSTD_LICENSE 0 → 100644
查看文件 @4f5343b
+++ b/vendor/github.com/DataDog/zstd/ZSTD_LICENSE 0 → 100644
查看文件 @4f5343b
+ BSD License
+ 
+ For Zstandard software
+ 
+ Copyright (c) 2016-present, Facebook, Inc. All rights reserved.
+ 
+ Redistribution and use in source and binary forms, with or without modification,
+ are permitted provided that the following conditions are met:
+ 
+  * Redistributions of source code must retain the above copyright notice, this
+    list of conditions and the following disclaimer.
+ 
+  * Redistributions in binary form must reproduce the above copyright notice,
+    this list of conditions and the following disclaimer in the documentation
+    and/or other materials provided with the distribution.
+ 
+  * Neither the name Facebook nor the names of its contributors may be used to
+    endorse or promote products derived from this software without specific
+    prior written permission.
+ 
+ THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
+ ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
+ WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+ DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
+ ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
+ (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
+ LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
+ ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
--- a/vendor/github.com/DataDog/zstd/bitstream.h 0 → 100644
查看文件 @4f5343b
+++ b/vendor/github.com/DataDog/zstd/bitstream.h 0 → 100644
查看文件 @4f5343b
+ /* ******************************************************************
+    bitstream
+    Part of FSE library
+    Copyright (C) 2013-present, Yann Collet.
+ 
+    BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php)
+ 
+    Redistribution and use in source and binary forms, with or without
+    modification, are permitted provided that the following conditions are
+    met:
+ 
+        * Redistributions of source code must retain the above copyright
+    notice, this list of conditions and the following disclaimer.
+        * Redistributions in binary form must reproduce the above
+    copyright notice, this list of conditions and the following disclaimer
+    in the documentation and/or other materials provided with the
+    distribution.
+ 
+    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+    "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+    OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+    SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+    LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+    DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+    THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+    (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+    OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ 
+    You can contact the author at :
+    - Source repository : https://github.com/Cyan4973/FiniteStateEntropy
+ ****************************************************************** */
+ #ifndef BITSTREAM_H_MODULE
+ #define BITSTREAM_H_MODULE
+ 
+ #if defined (__cplusplus)
+ extern "C" {
+ #endif
+ 
+ /*
+ *  This API consists of small unitary functions, which must be inlined for best performance.
+ *  Since link-time-optimization is not available for all compilers,
+ *  these functions are defined into a .h to be included.
+ */
+ 
+ /*-****************************************
+ *  Dependencies
+ ******************************************/
+ #include "mem.h"            /* unaligned access routines */
+ #include "debug.h"          /* assert(), DEBUGLOG(), RAWLOG() */
+ #include "error_private.h"  /* error codes and messages */
+ 
+ 
+ /*=========================================
+ *  Target specific
+ =========================================*/
+ #if defined(__BMI__) && defined(__GNUC__)
+ #  include <immintrin.h>   /* support for bextr (experimental) */
+ #endif
+ 
+ #define STREAM_ACCUMULATOR_MIN_32  25
+ #define STREAM_ACCUMULATOR_MIN_64  57
+ #define STREAM_ACCUMULATOR_MIN    ((U32)(MEM_32bits() ? STREAM_ACCUMULATOR_MIN_32 : STREAM_ACCUMULATOR_MIN_64))
+ 
+ 
+ /*-******************************************
+ *  bitStream encoding API (write forward)
+ ********************************************/
+ /* bitStream can mix input from multiple sources.
+  * A critical property of these streams is that they encode and decode in **reverse** direction.
+  * So the first bit sequence you add will be the last to be read, like a LIFO stack.
+  */
+ typedef struct {
+     size_t bitContainer;   /* local register; new bits are OR-ed in at offset bitPos */
+     unsigned bitPos;       /* number of bits currently stored in bitContainer */
+     char*  startPtr;       /* beginning of the destination buffer */
+     char*  ptr;            /* current write position inside the buffer */
+     char*  endPtr;         /* startPtr + dstCapacity - sizeof(bitContainer) */
+ } BIT_CStream_t;
+ 
+ MEM_STATIC size_t BIT_initCStream(BIT_CStream_t* bitC, void* dstBuffer, size_t dstCapacity);
+ MEM_STATIC void   BIT_addBits(BIT_CStream_t* bitC, size_t value, unsigned nbBits);
+ MEM_STATIC void   BIT_flushBits(BIT_CStream_t* bitC);
+ MEM_STATIC size_t BIT_closeCStream(BIT_CStream_t* bitC);
+ 
+ /* Start with initCStream, providing the size of buffer to write into.
+ *  bitStream will never write outside of this buffer.
+ *  `dstCapacity` must be > sizeof(bitC->bitContainer), otherwise @return will be an error code.
+ *
+ *  bits are first added to a local register.
+ *  Local register is size_t, hence 64-bits on 64-bits systems, or 32-bits on 32-bits systems.
+ *  Writing data into memory is an explicit operation, performed by the flushBits function.
+ *  Hence keep track how many bits are potentially stored into local register to avoid register overflow.
+ *  After a flushBits, a maximum of 7 bits might still be stored into local register.
+ *
+ *  Avoid storing elements of more than 24 bits if you want compatibility with 32-bits bitstream readers.
+ *
+ *  Last operation is to close the bitStream.
+ *  The function returns the final size of CStream in bytes.
+ *  If data couldn't fit into `dstBuffer`, it will return a 0 ( == not storable)
+ */
+ 
+ 
+ /*-********************************************
+ *  bitStream decoding API (read backward)
+ **********************************************/
+ typedef struct {
+     size_t   bitContainer;   /* local register holding a chunk of the bitStream */
+     unsigned bitsConsumed;   /* presumably the number of bits already read from bitContainer -- confirm against BIT_readBits() */
+     const char* ptr;
+     const char* start;
+     const char* limitPtr;
+ } BIT_DStream_t;
+ 
+ typedef enum { BIT_DStream_unfinished = 0,
+                BIT_DStream_endOfBuffer = 1,
+                BIT_DStream_completed = 2,
+                BIT_DStream_overflow = 3 } BIT_DStream_status;  /* result of BIT_reloadDStream() */
+                /* 1,2,4,8 would be better for bitmap combinations, but slows down performance a bit ... :( */
+ 
+ MEM_STATIC size_t   BIT_initDStream(BIT_DStream_t* bitD, const void* srcBuffer, size_t srcSize);
+ MEM_STATIC size_t   BIT_readBits(BIT_DStream_t* bitD, unsigned nbBits);
+ MEM_STATIC BIT_DStream_status BIT_reloadDStream(BIT_DStream_t* bitD);
+ MEM_STATIC unsigned BIT_endOfDStream(const BIT_DStream_t* bitD);
+ 
+ 
+ /* Start by invoking BIT_initDStream().
+ *  A chunk of the bitStream is then stored into a local register.
+ *  Local register size is 64-bits on 64-bits systems, 32-bits on 32-bits systems (size_t).
+ *  You can then retrieve bitFields stored into the local register, **in reverse order**.
+ *  Local register is explicitly reloaded from memory by the BIT_reloadDStream() method.
+ *  A reload guarantee a minimum of ((8*sizeof(bitD->bitContainer))-7) bits when its result is BIT_DStream_unfinished.
+ *  Otherwise, it can be less than that, so proceed accordingly.
+ *  Checking if DStream has reached its end can be performed with BIT_endOfDStream().
+ */
+ 
+ 
+ /*-****************************************
+ *  unsafe API
+ ******************************************/
+ MEM_STATIC void BIT_addBitsFast(BIT_CStream_t* bitC, size_t value, unsigned nbBits);
+ /* faster, but works only if value is "clean", meaning all high bits above nbBits are 0 */
+ 
+ MEM_STATIC void BIT_flushBitsFast(BIT_CStream_t* bitC);
+ /* unsafe version; does not check buffer overflow */
+ 
+ MEM_STATIC size_t BIT_readBitsFast(BIT_DStream_t* bitD, unsigned nbBits);
+ /* faster, but works only if nbBits >= 1 */
+ 
+ 
+ 
+ /*-**************************************************************
+ *  Internal functions
+ ****************************************************************/
+ /* BIT_highbit32() :
+  * @return : position (0-31) of the highest set bit of `val`.
+  * `val` must be non-zero (asserted). */
+ MEM_STATIC unsigned BIT_highbit32 (U32 val)
+ {
+     assert(val != 0);
+     {
+ #   if defined(_MSC_VER)   /* Visual */
+         unsigned long r=0;
+         _BitScanReverse ( &r, val );
+         return (unsigned) r;
+ #   elif defined(__GNUC__) && (__GNUC__ >= 3)   /* Use GCC Intrinsic */
+         return 31 - __builtin_clz (val);
+ #   else   /* Software version */
+         static const unsigned DeBruijnClz[32] = { 0,  9,  1, 10, 13, 21,  2, 29,
+                                                  11, 14, 16, 18, 22, 25,  3, 30,
+                                                   8, 12, 20, 28, 15, 17, 24,  7,
+                                                  19, 27, 23,  6, 26,  5,  4, 31 };
+         U32 v = val;
+         /* propagate the highest set bit into every lower position */
+         v |= v >> 1;
+         v |= v >> 2;
+         v |= v >> 4;
+         v |= v >> 8;
+         v |= v >> 16;
+         /* multiply-and-shift turns the result into a 5-bit table index */
+         return DeBruijnClz[ (U32) (v * 0x07C4ACDDU) >> 27];
+ #   endif
+     }
+ }
+ 
+ /*=====    Local Constants   =====*/
+ /* BIT_mask[n] has its n lowest bits set, i.e. (1<<n)-1, for n in [0, 31]. */
+ static const unsigned BIT_mask[] = {
+     0,          1,         3,         7,         0xF,       0x1F,
+     0x3F,       0x7F,      0xFF,      0x1FF,     0x3FF,     0x7FF,
+     0xFFF,      0x1FFF,    0x3FFF,    0x7FFF,    0xFFFF,    0x1FFFF,
+     0x3FFFF,    0x7FFFF,   0xFFFFF,   0x1FFFFF,  0x3FFFFF,  0x7FFFFF,
+     0xFFFFFF,   0x1FFFFFF, 0x3FFFFFF, 0x7FFFFFF, 0xFFFFFFF, 0x1FFFFFFF,
+     0x3FFFFFFF, 0x7FFFFFFF}; /* up to 31 bits */
+ /* number of entries in BIT_mask */
+ #define BIT_MASK_SIZE (sizeof(BIT_mask) / sizeof(BIT_mask[0]))
+ 
+ /*-**************************************************************
+ *  bitStream encoding
+ ****************************************************************/
+ /*! BIT_initCStream() :
+  *  Resets `bitC` so that it writes into the buffer starting at `startPtr`.
+  *  `dstCapacity` must be > sizeof(size_t)
+  *  @return : 0 if success,
+  *            otherwise an error code (can be tested using ERR_isError()) */
+ MEM_STATIC size_t BIT_initCStream(BIT_CStream_t* bitC,
+                                   void* startPtr, size_t dstCapacity)
+ {
+     bitC->bitContainer = 0;
+     bitC->bitPos = 0;
+     bitC->startPtr = (char*)startPtr;
+     bitC->ptr = bitC->startPtr;
+     /* endPtr leaves room for one full bitContainer before the end of the buffer */
+     bitC->endPtr = bitC->startPtr + dstCapacity - sizeof(bitC->bitContainer);
+     if (dstCapacity <= sizeof(bitC->bitContainer)) return ERROR(dstSize_tooSmall);
+     return 0;
+ }
+ 
+ /*! BIT_addBits() :
+  *  can add up to 31 bits into `bitC`.
+  *  Only the `nbBits` lowest bits of `value` are stored; higher bits are masked off.
+  *  Note : does not check for register overflow ! */
+ MEM_STATIC void BIT_addBits(BIT_CStream_t* bitC,
+                             size_t value, unsigned nbBits)
+ {
+     MEM_STATIC_ASSERT(BIT_MASK_SIZE == 32);
+     assert(nbBits < BIT_MASK_SIZE);
+     assert(nbBits + bitC->bitPos < sizeof(bitC->bitContainer) * 8);
+     /* place the masked value just above the bits already in the container */
+     bitC->bitContainer |= (value & BIT_mask[nbBits]) << bitC->bitPos;
+     bitC->bitPos += nbBits;
+ }
+ 
+ /*! BIT_addBitsFast() :
+  *  same as BIT_addBits(), without masking `value`.
+  *  works only if `value` is _clean_,
+  *  meaning all high bits above nbBits are 0 */
+ MEM_STATIC void BIT_addBitsFast(BIT_CStream_t* bitC,
+                                 size_t value, unsigned nbBits)
+ {
+     assert((value>>nbBits) == 0);
+     assert(nbBits + bitC->bitPos < sizeof(bitC->bitContainer) * 8);
+     bitC->bitContainer |= value << bitC->bitPos;
+     bitC->bitPos += nbBits;
+ }
+ 
+ /*! BIT_flushBitsFast() :
+  *  assumption : bitContainer has not overflowed
+  *  unsafe version; does not check buffer overflow */
+ MEM_STATIC void BIT_flushBitsFast(BIT_CStream_t* bitC)
+ {
+     size_t const nbBytes = bitC->bitPos >> 3;   /* number of complete bytes held in the container */
+     assert(bitC->bitPos < sizeof(bitC->bitContainer) * 8);
+     /* the whole container is written, but ptr only advances by the complete bytes */
+     MEM_writeLEST(bitC->ptr, bitC->bitContainer);
+     bitC->ptr += nbBytes;
+     assert(bitC->ptr <= bitC->endPtr);
+     /* keep the 0-7 leftover bits at the bottom of the container */
+     bitC->bitPos &= 7;
+     bitC->bitContainer >>= nbBytes*8;
+ }
+ 
+ /*! BIT_flushBits() :
+  *  Writes the whole bit container at the current write position with
+  *  MEM_writeLEST(), advances the write pointer by the number of complete
+  *  bytes accumulated so far (bitPos / 8), and keeps the remaining 0-7 bits
+  *  in the container.
+  *  assumption : bitContainer has not overflowed
+  *  safe version; check for buffer overflow, and prevents it
+  *  by never letting the write pointer move past `endPtr`.
+  *  note : does not signal buffer overflow.
+  *  overflow will be revealed later on using BIT_closeCStream() */
+ MEM_STATIC void BIT_flushBits(BIT_CStream_t* bitC)
+ {
+     size_t const nbBytes = bitC->bitPos >> 3;
+     assert(bitC->bitPos < sizeof(bitC->bitContainer) * 8);
+     MEM_writeLEST(bitC->ptr, bitC->bitContainer);
+     bitC->ptr += nbBytes;
+     if (bitC->ptr > bitC->endPtr) bitC->ptr = bitC->endPtr;   /* clamp : later writes stay inside the buffer */
+     bitC->bitPos &= 7;   /* bits of the last, incomplete byte stay pending */
+     bitC->bitContainer >>= nbBytes*8;   /* drop the bytes that were just committed */
+ }
+ 
+ /*! BIT_closeCStream() :
+  *  Appends a single 1-bit as end mark, then flushes the container with
+  *  BIT_flushBits().
+  *  @return : size of CStream, in bytes
+  *            (a partially filled last byte counts as one full byte),
+  *            or 0 if it could not fit into dstBuffer */
+ MEM_STATIC size_t BIT_closeCStream(BIT_CStream_t* bitC)
+ {
+     BIT_addBitsFast(bitC, 1, 1);   /* endMark */
+     BIT_flushBits(bitC);
+     if (bitC->ptr >= bitC->endPtr) return 0; /* overflow detected */
+     return (bitC->ptr - bitC->startPtr) + (bitC->bitPos > 0);
+ }
+ 
+ 
+ /*-********************************************************
+ *  bitStream decoding
+ **********************************************************/
+ /*! BIT_initDStream() :
+  *  Initialize a BIT_DStream_t.
+  * `bitD` : a pointer to an already allocated BIT_DStream_t structure.
+  * `srcBuffer` : start of the bitStream.
+  * `srcSize` must be the *exact* size of the bitStream, in bytes.
+  *  The highest set bit of the last byte is the end mark : that bit and the
+  *  zero bits above it are counted as already consumed.
+  * @return : size of stream (== srcSize), or an errorCode if a problem is detected :
+  *           ERROR(srcSize_wrong) if srcSize < 1 (`bitD` is zeroed in that case),
+  *           ERROR(GENERIC) (srcSize >= container size) or ERROR(corruption_detected)
+  *           (smaller srcSize) if the last byte is 0, i.e. the end mark is missing.
+  */
+ MEM_STATIC size_t BIT_initDStream(BIT_DStream_t* bitD, const void* srcBuffer, size_t srcSize)
+ {
+     if (srcSize < 1) { memset(bitD, 0, sizeof(*bitD)); return ERROR(srcSize_wrong); }
+ 
+     bitD->start = (const char*)srcBuffer;
+     bitD->limitPtr = bitD->start + sizeof(bitD->bitContainer);   /* compared against `ptr` by BIT_reloadDStream() */
+ 
+     if (srcSize >=  sizeof(bitD->bitContainer)) {  /* normal case */
+         bitD->ptr   = (const char*)srcBuffer + srcSize - sizeof(bitD->bitContainer);
+         bitD->bitContainer = MEM_readLEST(bitD->ptr);
+         { BYTE const lastByte = ((const BYTE*)srcBuffer)[srcSize-1];
+           bitD->bitsConsumed = lastByte ? 8 - BIT_highbit32(lastByte) : 0;  /* ensures bitsConsumed is always set */
+           if (lastByte == 0) return ERROR(GENERIC); /* endMark not present */ }
+     } else {   /* srcSize < sizeof(bitD->bitContainer) : assemble the container byte by byte */
+         bitD->ptr   = bitD->start;
+         bitD->bitContainer = *(const BYTE*)(bitD->start);
+         switch(srcSize)
+         {
+         case 7: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[6]) << (sizeof(bitD->bitContainer)*8 - 16);
+                 /* fall-through */
+ 
+         case 6: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[5]) << (sizeof(bitD->bitContainer)*8 - 24);
+                 /* fall-through */
+ 
+         case 5: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[4]) << (sizeof(bitD->bitContainer)*8 - 32);
+                 /* fall-through */
+ 
+         case 4: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[3]) << 24;
+                 /* fall-through */
+ 
+         case 3: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[2]) << 16;
+                 /* fall-through */
+ 
+         case 2: bitD->bitContainer += (size_t)(((const BYTE*)(srcBuffer))[1]) <<  8;
+                 /* fall-through */
+ 
+         default: break;
+         }
+         {   BYTE const lastByte = ((const BYTE*)srcBuffer)[srcSize-1];
+             bitD->bitsConsumed = lastByte ? 8 - BIT_highbit32(lastByte) : 0;
+             if (lastByte == 0) return ERROR(corruption_detected);  /* endMark not present */
+         }
+         bitD->bitsConsumed += (U32)(sizeof(bitD->bitContainer) - srcSize)*8;   /* the container bytes that received no input count as consumed */
+     }
+ 
+     return srcSize;
+ }
+ /*! BIT_getUpperBits() :
+  * @return : `bitContainer` shifted right by `start` bits. */
+ MEM_STATIC size_t BIT_getUpperBits(size_t bitContainer, U32 const start)
+ {
+     return bitContainer >> start;
+ }
+ /*! BIT_getMiddleBits() :
+  *  Extracts `nbBits` bits of `bitContainer`, starting at bit position `start`.
+  *  `start` is reduced modulo the register width before shifting.
+  *  `nbBits` must be < BIT_MASK_SIZE (verified by assert() only).
+  * @return : the extracted bits, placed in the low bits of the result. */
+ MEM_STATIC size_t BIT_getMiddleBits(size_t bitContainer, U32 const start, U32 const nbBits)
+ {
+     U32 const regMask = sizeof(bitContainer)*8 - 1;
+     /* if start > regMask, bitstream is corrupted, and result is undefined */
+     assert(nbBits < BIT_MASK_SIZE);
+     return (bitContainer >> (start & regMask)) & BIT_mask[nbBits];
+ }
+ /*! BIT_getLowerBits() :
+  *  `nbBits` must be < BIT_MASK_SIZE (verified by assert() only).
+  * @return : the `nbBits` lowest bits of `bitContainer`. */
+ MEM_STATIC size_t BIT_getLowerBits(size_t bitContainer, U32 const nbBits)
+ {
+     assert(nbBits < BIT_MASK_SIZE);
+     return bitContainer & BIT_mask[nbBits];
+ }
+ 
+ /*! BIT_lookBits() :
+  *  Provides next n bits from local register.
+  *  The bits are taken directly below the `bitsConsumed` highest bits
+  *  of the container.
+  *  local register is not modified.
+  *  On 32-bits, maxNbBits==24.
+  *  On 64-bits, maxNbBits==56.
+  * @return : value extracted */
+ MEM_STATIC size_t BIT_lookBits(const BIT_DStream_t* bitD, U32 nbBits)
+ {
+     /* arbitrate between double-shift and shift+mask */
+ #if 1
+     /* if bitD->bitsConsumed + nbBits > sizeof(bitD->bitContainer)*8,
+      * bitstream is likely corrupted, and result is undefined */
+     return BIT_getMiddleBits(bitD->bitContainer, (sizeof(bitD->bitContainer)*8) - bitD->bitsConsumed - nbBits, nbBits);
+ #else
+     /* this code path is slower on my os-x laptop */
+     U32 const regMask = sizeof(bitD->bitContainer)*8 - 1;
+     return ((bitD->bitContainer << (bitD->bitsConsumed & regMask)) >> 1) >> ((regMask-nbBits) & regMask);
+ #endif
+ }
+ 
+ /*! BIT_lookBitsFast() :
+  *  Same purpose as BIT_lookBits(), implemented with two shifts : the bits
+  *  already consumed are shifted out on the left, then the result is shifted
+  *  right so that only `nbBits` bits remain. `bitD` is not modified.
+  *  unsafe version; only works if nbBits >= 1 */
+ MEM_STATIC size_t BIT_lookBitsFast(const BIT_DStream_t* bitD, U32 nbBits)
+ {
+     U32 const regMask = sizeof(bitD->bitContainer)*8 - 1;
+     assert(nbBits >= 1);
+     return (bitD->bitContainer << (bitD->bitsConsumed & regMask)) >> (((regMask+1)-nbBits) & regMask);
+ }
+ /*! BIT_skipBits() :
+  *  Marks `nbBits` more bits as consumed; the container itself is untouched. */
+ MEM_STATIC void BIT_skipBits(BIT_DStream_t* bitD, U32 nbBits)
+ {
+     bitD->bitsConsumed += nbBits;
+ }
+ 
+ /*! BIT_readBits() :
+  *  Read (consume) next n bits from local register and update.
+  *  Combines BIT_lookBits() and BIT_skipBits().
+  *  Take care not to read more bits than the local register currently holds.
+  * @return : extracted value. */
+ MEM_STATIC size_t BIT_readBits(BIT_DStream_t* bitD, unsigned nbBits)
+ {
+     size_t const value = BIT_lookBits(bitD, nbBits);
+     BIT_skipBits(bitD, nbBits);
+     return value;
+ }
+ 
+ /*! BIT_readBitsFast() :
+  *  Read (consume) next n bits using BIT_lookBitsFast(), then BIT_skipBits().
+  *  unsafe version; only works if nbBits >= 1
+  * @return : extracted value. */
+ MEM_STATIC size_t BIT_readBitsFast(BIT_DStream_t* bitD, unsigned nbBits)
+ {
+     size_t const value = BIT_lookBitsFast(bitD, nbBits);
+     assert(nbBits >= 1);
+     BIT_skipBits(bitD, nbBits);
+     return value;
+ }
+ 
+ /*! BIT_reloadDStream() :
+  *  Refill `bitD` from buffer previously set in BIT_initDStream() .
+  *  Whole consumed bytes are dropped by moving `ptr` backwards in the buffer
+  *  and reloading the container from there; `bitsConsumed` keeps the remainder.
+  *  This function is safe, it guarantees it will not read beyond src buffer.
+  * @return : status of `BIT_DStream_t` internal register.
+  *           BIT_DStream_overflow : more bits were consumed than the container holds (nothing is reloaded).
+  *           BIT_DStream_endOfBuffer : `ptr` has reached `start`; unconsumed bits may remain.
+  *           BIT_DStream_completed : `ptr` is at `start` and every bit of the container is consumed.
+  *           when status == BIT_DStream_unfinished, internal register is filled with at least 25 or 57 bits */
+ MEM_STATIC BIT_DStream_status BIT_reloadDStream(BIT_DStream_t* bitD)
+ {
+     if (bitD->bitsConsumed > (sizeof(bitD->bitContainer)*8))  /* overflow detected, like end of stream */
+         return BIT_DStream_overflow;
+ 
+     if (bitD->ptr >= bitD->limitPtr) {   /* far enough from `start` : a full backward step cannot go below it */
+         bitD->ptr -= bitD->bitsConsumed >> 3;
+         bitD->bitsConsumed &= 7;
+         bitD->bitContainer = MEM_readLEST(bitD->ptr);
+         return BIT_DStream_unfinished;
+     }
+     if (bitD->ptr == bitD->start) {   /* nothing left to reload */
+         if (bitD->bitsConsumed < sizeof(bitD->bitContainer)*8) return BIT_DStream_endOfBuffer;
+         return BIT_DStream_completed;
+     }
+     /* start < ptr < limitPtr */
+     {   U32 nbBytes = bitD->bitsConsumed >> 3;
+         BIT_DStream_status result = BIT_DStream_unfinished;
+         if (bitD->ptr - nbBytes < bitD->start) {   /* limit the step so that ptr stops exactly at `start` */
+             nbBytes = (U32)(bitD->ptr - bitD->start);  /* ptr > start */
+             result = BIT_DStream_endOfBuffer;
+         }
+         bitD->ptr -= nbBytes;
+         bitD->bitsConsumed -= nbBytes*8;
+         bitD->bitContainer = MEM_readLEST(bitD->ptr);   /* reminder : srcSize > sizeof(bitD->bitContainer), otherwise bitD->ptr == bitD->start */
+         return result;
+     }
+ }
+ 
+ /*! BIT_endOfDStream() :
+  *  Tells whether the read pointer is back at the start of the buffer and
+  *  every bit of the container has been consumed.
+  * @return : 1 if DStream has _exactly_ reached its end (all bits consumed),
+  *           0 otherwise.
+  */
+ MEM_STATIC unsigned BIT_endOfDStream(const BIT_DStream_t* DStream)
+ {
+     if (DStream->ptr != DStream->start) return 0;
+     return (DStream->bitsConsumed == sizeof(DStream->bitContainer)*8);
+ }
+ 
+ #if defined (__cplusplus)
+ }
+ #endif
+ 
+ #endif /* BITSTREAM_H_MODULE */
--- a/vendor/github.com/DataDog/zstd/compiler.h 0 → 100644
查看文件 @4f5343b
+++ b/vendor/github.com/DataDog/zstd/compiler.h 0 → 100644
查看文件 @4f5343b
+ /*
+  * Copyright (c) 2016-present, Yann Collet, Facebook, Inc.
+  * All rights reserved.
+  *
+  * This source code is licensed under both the BSD-style license (found in the
+  * LICENSE file in the root directory of this source tree) and the GPLv2 (found
+  * in the COPYING file in the root directory of this source tree).
+  * You may select, at your option, one of the above-listed licenses.
+  */
+ 
+ #ifndef ZSTD_COMPILER_H
+ #define ZSTD_COMPILER_H
+ 
+ /*-*******************************************************
+ *  Compiler specifics
+ *********************************************************/
+ /* force inlining */
+ 
+ #if !defined(ZSTD_NO_INLINE)
+ #if defined (__GNUC__) || defined(__cplusplus) || defined(__STDC_VERSION__) && __STDC_VERSION__ >= 199901L   /* C99 */
+ #  define INLINE_KEYWORD inline
+ #else
+ #  define INLINE_KEYWORD
+ #endif
+ 
+ #if defined(__GNUC__)
+ #  define FORCE_INLINE_ATTR __attribute__((always_inline))
+ #elif defined(_MSC_VER)
+ #  define FORCE_INLINE_ATTR __forceinline
+ #else
+ #  define FORCE_INLINE_ATTR
+ #endif
+ 
+ #else
+ 
+ #define INLINE_KEYWORD
+ #define FORCE_INLINE_ATTR
+ 
+ #endif
+ 
+ /**
+  * FORCE_INLINE_TEMPLATE is used to define C "templates", which take constant
+  * parameters. They must be inlined for the compiler to eliminate the constant
+  * branches.
+  */
+ #define FORCE_INLINE_TEMPLATE static INLINE_KEYWORD FORCE_INLINE_ATTR
+ /**
+  * HINT_INLINE is used to help the compiler generate better code. It is *not*
+  * used for "templates", so it can be tweaked based on the compiler's
+  * performance.
+  *
+  * gcc-4.8 and gcc-4.9 have been shown to benefit from leaving off the
+  * always_inline attribute.
+  *
+  * clang up to 5.0.0 (trunk) benefit tremendously from the always_inline
+  * attribute.
+  */
+ #if !defined(__clang__) && defined(__GNUC__) && __GNUC__ >= 4 && __GNUC_MINOR__ >= 8 && __GNUC__ < 5
+ #  define HINT_INLINE static INLINE_KEYWORD
+ #else
+ #  define HINT_INLINE static INLINE_KEYWORD FORCE_INLINE_ATTR
+ #endif
+ 
+ /* force no inlining */
+ #ifdef _MSC_VER
+ #  define FORCE_NOINLINE static __declspec(noinline)
+ #else
+ #  ifdef __GNUC__
+ #    define FORCE_NOINLINE static __attribute__((__noinline__))
+ #  else
+ #    define FORCE_NOINLINE static
+ #  endif
+ #endif
+ 
+ /* target attribute */
+ #ifndef __has_attribute
+   #define __has_attribute(x) 0  /* Compatibility with non-clang compilers. */
+ #endif
+ #if defined(__GNUC__)
+ #  define TARGET_ATTRIBUTE(target) __attribute__((__target__(target)))
+ #else
+ #  define TARGET_ATTRIBUTE(target)
+ #endif
+ 
+ /* Enable runtime BMI2 dispatch based on the CPU.
+  * Enabled for clang & gcc >=4.8 on x86 when BMI2 isn't enabled by default.
+  */
+ #ifndef DYNAMIC_BMI2
+   #if ((defined(__clang__) && __has_attribute(__target__)) \
+       || (defined(__GNUC__) \
+           && (__GNUC__ >= 5 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 8)))) \
+       && (defined(__x86_64__) || defined(_M_X86)) \
+       && !defined(__BMI2__)
+   #  define DYNAMIC_BMI2 1
+   #else
+   #  define DYNAMIC_BMI2 0
+   #endif
+ #endif
+ 
+ /* prefetch
+  * can be disabled, by declaring NO_PREFETCH build macro */
+ #if defined(NO_PREFETCH)
+ #  define PREFETCH_L1(ptr)  (void)(ptr)  /* disabled */
+ #  define PREFETCH_L2(ptr)  (void)(ptr)  /* disabled */
+ #else
+ #  if defined(_MSC_VER) && (defined(_M_X64) || defined(_M_I86))  /* _mm_prefetch() is not defined outside of x86/x64 */
+ #    include <mmintrin.h>   /* https://msdn.microsoft.com/fr-fr/library/84szxsww(v=vs.90).aspx */
+ #    define PREFETCH_L1(ptr)  _mm_prefetch((const char*)(ptr), _MM_HINT_T0)
+ #    define PREFETCH_L2(ptr)  _mm_prefetch((const char*)(ptr), _MM_HINT_T1)
+ #  elif defined(__GNUC__) && ( (__GNUC__ >= 4) || ( (__GNUC__ == 3) && (__GNUC_MINOR__ >= 1) ) )
+ #    define PREFETCH_L1(ptr)  __builtin_prefetch((ptr), 0 /* rw==read */, 3 /* locality */)
+ #    define PREFETCH_L2(ptr)  __builtin_prefetch((ptr), 0 /* rw==read */, 2 /* locality */)
+ #  else
+ #    define PREFETCH_L1(ptr) (void)(ptr)  /* disabled */
+ #    define PREFETCH_L2(ptr) (void)(ptr)  /* disabled */
+ #  endif
+ #endif  /* NO_PREFETCH */
+ 
+ #define CACHELINE_SIZE 64
+ /* PREFETCH_AREA(p, s) :
+  * issues PREFETCH_L2() over the `s` bytes starting at `p`,
+  * one request every CACHELINE_SIZE bytes.
+  * Expands to a braced block that evaluates `p` and `s` once each. */
+ #define PREFETCH_AREA(p, s)  {            \
+     const char* const _ptr = (const char*)(p);  \
+     size_t const _size = (size_t)(s);     \
+     size_t _pos;                          \
+     for (_pos=0; _pos<_size; _pos+=CACHELINE_SIZE) {  \
+         PREFETCH_L2(_ptr + _pos);         \
+     }                                     \
+ }
+ 
+ /* disable warnings */
+ #ifdef _MSC_VER    /* Visual Studio */
+ #  include <intrin.h>                    /* For Visual 2005 */
+ #  pragma warning(disable : 4100)        /* disable: C4100: unreferenced formal parameter */
+ #  pragma warning(disable : 4127)        /* disable: C4127: conditional expression is constant */
+ #  pragma warning(disable : 4204)        /* disable: C4204: non-constant aggregate initializer */
+ #  pragma warning(disable : 4214)        /* disable: C4214: non-int bitfields */
+ #  pragma warning(disable : 4324)        /* disable: C4324: padded structure */
+ #endif
+ 
+ #endif /* ZSTD_COMPILER_H */
--- a/vendor/github.com/DataDog/zstd/cover.c 0 → 100644
查看文件 @4f5343b
+++ b/vendor/github.com/DataDog/zstd/cover.c 0 → 100644
查看文件 @4f5343b
+ /*
+  * Copyright (c) 2016-present, Yann Collet, Facebook, Inc.
+  * All rights reserved.
+  *
+  * This source code is licensed under both the BSD-style license (found in the
+  * LICENSE file in the root directory of this source tree) and the GPLv2 (found
+  * in the COPYING file in the root directory of this source tree).
+  * You may select, at your option, one of the above-listed licenses.
+  */
+ 
+ /* *****************************************************************************
+  * Constructs a dictionary using a heuristic based on the following paper:
+  *
+  * Liao, Petri, Moffat, Wirth
+  * Effective Construction of Relative Lempel-Ziv Dictionaries
+  * Published in WWW 2016.
+  *
+  * Adapted from code originally written by @ot (Giuseppe Ottaviano).
+  ******************************************************************************/
+ 
+ /*-*************************************
+ *  Dependencies
+ ***************************************/
+ #include <stdio.h>  /* fprintf */
+ #include <stdlib.h> /* malloc, free, qsort */
+ #include <string.h> /* memset */
+ #include <time.h>   /* clock */
+ 
+ #include "mem.h" /* read */
+ #include "pool.h"
+ #include "threading.h"
+ #include "cover.h"
+ #include "zstd_internal.h" /* includes zstd.h */
+ #ifndef ZDICT_STATIC_LINKING_ONLY
+ #define ZDICT_STATIC_LINKING_ONLY
+ #endif
+ #include "zdict.h"
+ 
+ /*-*************************************
+ *  Constants
+ ***************************************/
+ #define COVER_MAX_SAMPLES_SIZE (sizeof(size_t) == 8 ? ((unsigned)-1) : ((unsigned)1 GB))
+ #define DEFAULT_SPLITPOINT 1.0
+ 
+ /*-*************************************
+ *  Console display
+ ***************************************/
+ static int g_displayLevel = 2;
+ #define DISPLAY(...)                                                           \
+   {                                                                            \
+     fprintf(stderr, __VA_ARGS__);                                              \
+     fflush(stderr);                                                            \
+   }
+ #define LOCALDISPLAYLEVEL(displayLevel, l, ...)                                \
+   if (displayLevel >= l) {                                                     \
+     DISPLAY(__VA_ARGS__);                                                      \
+   } /* 0 : no display;   1: errors;   2: default;  3: details;  4: debug */
+ #define DISPLAYLEVEL(l, ...) LOCALDISPLAYLEVEL(g_displayLevel, l, __VA_ARGS__)
+ 
+ #define LOCALDISPLAYUPDATE(displayLevel, l, ...)                               \
+   if (displayLevel >= l) {                                                     \
+     if ((clock() - g_time > refreshRate) || (displayLevel >= 4)) {             \
+       g_time = clock();                                                        \
+       DISPLAY(__VA_ARGS__);                                                    \
+     }                                                                          \
+   }
+ #define DISPLAYUPDATE(l, ...) LOCALDISPLAYUPDATE(g_displayLevel, l, __VA_ARGS__)
+ static const clock_t refreshRate = CLOCKS_PER_SEC * 15 / 100;
+ static clock_t g_time = 0;
+ 
+ /*-*************************************
+ * Hash table
+ ***************************************
+ * A small specialized hash map for storing activeDmers.
+ * The map does not resize, so if it becomes full it will loop forever.
+ * Thus, the map must be large enough to store every value.
+ * The map implements linear probing and keeps its load less than 0.5.
+ */
+ 
+ #define MAP_EMPTY_VALUE ((U32)-1)   /* `value` stored in a slot that holds no entry */
+ typedef struct COVER_map_pair_t_s {
+   U32 key;     /* key stored in this slot; only meaningful when the slot is in use */
+   U32 value;   /* value for `key`, or MAP_EMPTY_VALUE when the slot is empty */
+ } COVER_map_pair_t;
+ 
+ typedef struct COVER_map_s {
+   COVER_map_pair_t *data;   /* table of `size` slots, allocated by COVER_map_init() */
+   U32 sizeLog;              /* log2 of `size` */
+   U32 size;                 /* number of slots, always 1 << sizeLog after a successful init */
+   U32 sizeMask;             /* size - 1, used to wrap slot indices */
+ } COVER_map_t;
+ 
+ /**
+  * Clear the map.
+  * Every byte of the table is set to the low byte of MAP_EMPTY_VALUE (0xFF),
+  * so the `value` (and `key`) of each slot reads back as all-ones, which is
+  * MAP_EMPTY_VALUE.
+  */
+ static void COVER_map_clear(COVER_map_t *map) {
+   memset(map->data, MAP_EMPTY_VALUE, map->size * sizeof(COVER_map_pair_t));
+ }
+ 
+ /**
+  * Initializes a map of the given size.
+  * The table gets 1 << (ZSTD_highbit32(size) + 2) slots, all marked empty.
+  * Returns 1 on success and 0 on failure.
+  * On allocation failure `data` is NULL and `sizeLog` and `size` are reset
+  * to 0 (`sizeMask` is left as computed).
+  * The map must be destroyed with COVER_map_destroy().
+  * The map is only guaranteed to be large enough to hold size elements.
+  * NOTE(review): `size` is presumably expected to be non-zero, since it is
+  * passed to ZSTD_highbit32() - confirm against that helper.
+  */
+ static int COVER_map_init(COVER_map_t *map, U32 size) {
+   map->sizeLog = ZSTD_highbit32(size) + 2;
+   map->size = (U32)1 << map->sizeLog;
+   map->sizeMask = map->size - 1;
+   map->data = (COVER_map_pair_t *)malloc(map->size * sizeof(COVER_map_pair_t));
+   if (!map->data) {
+     map->sizeLog = 0;
+     map->size = 0;
+     return 0;
+   }
+   COVER_map_clear(map);
+   return 1;
+ }
+ 
+ /**
+  * Internal hash function
+  * Multiplies `key` by prime4bytes and keeps the `map->sizeLog` highest bits
+  * of the 32-bit product, which yields a slot index below `map->size`.
+  * NOTE(review): assumes U32 is exactly 32 bits wide and
+  * 1 <= map->sizeLog <= 32 - confirm.
+  */
+ static const U32 prime4bytes = 2654435761U;
+ static U32 COVER_map_hash(COVER_map_t *map, U32 key) {
+   return (key * prime4bytes) >> (32 - map->sizeLog);
+ }
+ 
+ /**
+  * Finds the slot that belongs to `key`.
+  * Probing starts at the hashed position and moves forward one slot at a
+  * time, wrapping around the table.  It stops at the first slot that is
+  * either empty or already holds `key`, and returns that slot's index.
+  * Does not terminate if the table is full and does not contain `key`.
+  */
+ static U32 COVER_map_index(COVER_map_t *map, U32 key) {
+   U32 slot = COVER_map_hash(map, key);
+   while (map->data[slot].value != MAP_EMPTY_VALUE &&
+          map->data[slot].key != key) {
+     slot = (slot + 1) & map->sizeMask;
+   }
+   return slot;
+ }
+ 
+ /**
+  * Returns the pointer to the value for key.
+  * If key is not in the map, it is inserted and the value is set to 0.
+  * The returned pointer refers to storage inside the map's table.
+  * The map must not be full.
+  */
+ static U32 *COVER_map_at(COVER_map_t *map, U32 key) {
+   COVER_map_pair_t *pos = &map->data[COVER_map_index(map, key)];
+   if (pos->value == MAP_EMPTY_VALUE) {   /* empty slot : key was absent, claim the slot */
+     pos->key = key;
+     pos->value = 0;
+   }
+   return &pos->value;
+ }
+ 
+ /**
+  * Deletes key from the map if present.
+  * The entries that follow the removed slot in probing order are examined up
+  * to the next empty slot; an entry is moved back into the freed slot when
+  * its distance from its own hash position allows it, so that no gap is left
+  * between an entry and the position where its lookup starts.
+  */
+ static void COVER_map_remove(COVER_map_t *map, U32 key) {
+   U32 i = COVER_map_index(map, key);
+   COVER_map_pair_t *del = &map->data[i];   /* slot that currently has to be freed or refilled */
+   U32 shift = 1;                           /* distance, in slots, between `del` and the slot examined */
+   if (del->value == MAP_EMPTY_VALUE) {     /* key is not in the map */
+     return;
+   }
+   for (i = (i + 1) & map->sizeMask;; i = (i + 1) & map->sizeMask) {
+     COVER_map_pair_t *const pos = &map->data[i];
+     /* If the position is empty we are done */
+     if (pos->value == MAP_EMPTY_VALUE) {
+       del->value = MAP_EMPTY_VALUE;
+       return;
+     }
+     /* If pos can be moved to del do so */
+     if (((i - COVER_map_hash(map, pos->key)) & map->sizeMask) >= shift) {
+       del->key = pos->key;
+       del->value = pos->value;
+       del = pos;   /* the slot just vacated becomes the new hole */
+       shift = 1;
+     } else {
+       ++shift;
+     }
+   }
+ }
+ 
+ /**
+  * Releases the table of a map set up by COVER_map_init().
+  * Afterwards `data` is NULL and `size` is 0; a map whose `data` is already
+  * NULL is left in that same state.
+  */
+ static void COVER_map_destroy(COVER_map_t *map) {
+   COVER_map_pair_t *const table = map->data;
+   map->data = NULL;
+   map->size = 0;
+   if (table != NULL) {
+     free(table);
+   }
+ }
+ 
+ /*-*************************************
+ * Context
+ ***************************************/
+ 
+ typedef struct {
+   const BYTE *samples;          /* sample buffer handed to COVER_ctx_init(); not freed by COVER_ctx_destroy() */
+   size_t *offsets;              /* allocated with nbSamples + 1 entries; COVER_group() reads them as sample end positions */
+   const size_t *samplesSizes;   /* per-sample sizes handed to COVER_ctx_init(); not freed by COVER_ctx_destroy() */
+   size_t nbSamples;             /* total number of samples */
+   size_t nbTrainSamples;        /* number of samples in the training set */
+   size_t nbTestSamples;         /* number of samples in the testing set */
+   U32 *suffix;                  /* partial suffix array, `suffixSize` entries; COVER_group() overwrites the
+                                  * first entry of each group with that dmer's frequency */
+   size_t suffixSize;            /* number of entries in `suffix` and `dmerAt` */
+   U32 *freqs;                   /* freed by COVER_ctx_destroy(); presumably the per-dmer frequencies - TODO confirm */
+   U32 *dmerAt;                  /* maps a position in `samples` to its dmerId */
+   unsigned d;                   /* dmer length, in bytes, used by the comparison functions */
+ } COVER_ctx_t;
+ 
+ /* We need a global context for qsort... */
+ static COVER_ctx_t *g_ctx = NULL;
+ 
+ /*-*************************************
+ *  Helper functions
+ ***************************************/
+ 
+ /**
+  * Adds up the first `nbSamples` entries of `samplesSizes`.
+  * Returns 0 when `nbSamples` is 0.
+  */
+ size_t COVER_sum(const size_t *samplesSizes, unsigned nbSamples) {
+   const size_t *cur = samplesSizes;
+   unsigned remaining = nbSamples;
+   size_t total = 0;
+   while (remaining != 0) {
+     total += *cur++;
+     --remaining;
+   }
+   return total;
+ }
+ 
+ /**
+  * Compares the dmers (ctx->d bytes each) found at two positions of
+  * ctx->samples. `lp` and `rp` point to the U32 positions.
+  * Returns a negative value if the dmer at lp is less than the dmer at rp.
+  * Return 0 if the dmers at lp and rp are equal.
+  * Returns a positive value if the dmer at lp is greater than the dmer at rp.
+  * The result is the raw memcmp() result, so it is not limited to -1 and 1.
+  */
+ static int COVER_cmp(COVER_ctx_t *ctx, const void *lp, const void *rp) {
+   U32 const lhs = *(U32 const *)lp;
+   U32 const rhs = *(U32 const *)rp;
+   return memcmp(ctx->samples + lhs, ctx->samples + rhs, ctx->d);
+ }
+ /**
+  * Faster version for d <= 8.
+  * Loads 8 bytes at each position with MEM_readLE64(), keeps only the low
+  * ctx->d bytes of each load and compares the two resulting integers.
+  * Returns -1, 0 or 1.
+  */
+ static int COVER_cmp8(COVER_ctx_t *ctx, const void *lp, const void *rp) {
+   U32 const lpos = *(U32 const *)lp;
+   U32 const rpos = *(U32 const *)rp;
+   U64 keep = (U64)-1;
+   U64 lval;
+   U64 rval;
+   if (ctx->d != 8) {
+     keep = ((U64)1 << (8 * ctx->d)) - 1;
+   }
+   lval = MEM_readLE64(ctx->samples + lpos) & keep;
+   rval = MEM_readLE64(ctx->samples + rpos) & keep;
+   return (lval > rval) - (lval < rval);
+ }
+ 
+ /**
+  * Comparison function built on COVER_cmp(): when the two dmers compare
+  * equal, the order is decided by the pointer values `lp` and `rp`, so the
+  * result is never 0.
+  * NOTE: g_ctx must be set to call this function.  A global is required because
+  * qsort doesn't take an opaque pointer.
+  */
+ static int COVER_strict_cmp(const void *lp, const void *rp) {
+   int const order = COVER_cmp(g_ctx, lp, rp);
+   if (order != 0) {
+     return order;
+   }
+   return (lp < rp) ? -1 : 1;
+ }
+ /**
+  * Faster version for d <= 8.
+  * Uses COVER_cmp8() with the global g_ctx; when the two dmers compare
+  * equal, the order is decided by the pointer values `lp` and `rp`.
+  */
+ static int COVER_strict_cmp8(const void *lp, const void *rp) {
+   int const order = COVER_cmp8(g_ctx, lp, rp);
+   if (order != 0) {
+     return order;
+   }
+   return (lp < rp) ? -1 : 1;
+ }
+ 
+ /**
+  * Binary search over the range [first, last).
+  * Returns a pointer to the first element that is not less than value, or
+  * last when every element is less than value.
+  */
+ static const size_t *COVER_lower_bound(const size_t *first, const size_t *last,
+                                        size_t value) {
+   const size_t *lo = first;
+   const size_t *hi = last;
+   while (lo != hi) {
+     const size_t *const mid = lo + (size_t)(hi - lo) / 2;
+     if (*mid < value) {
+       lo = mid + 1;
+     } else {
+       hi = mid;
+     }
+   }
+   return lo;
+ }
+ 
+ /**
+  * Generic groupBy function.
+  * Groups an array sorted by cmp into groups with equivalent values.
+  * Calls grp for each group.
+  *
+  * data  : array of `count` elements, each `size` bytes wide.
+  * ctx   : passed through unchanged to cmp and grp.
+  * cmp   : returns 0 when two elements belong to the same group; every
+  *         candidate is compared against the first element of its group.
+  * grp   : called once per group with pointers to the group's first element
+  *         and to one past its last element.
+  */
+ static void
+ COVER_groupBy(const void *data, size_t count, size_t size, COVER_ctx_t *ctx,
+               int (*cmp)(COVER_ctx_t *, const void *, const void *),
+               void (*grp)(COVER_ctx_t *, const void *, const void *)) {
+   const BYTE *ptr = (const BYTE *)data;
+   size_t num = 0;   /* number of elements assigned to a group so far */
+   while (num < count) {
+     const BYTE *grpEnd = ptr + size;
+     ++num;
+     while (num < count && cmp(ctx, ptr, grpEnd) == 0) {
+       grpEnd += size;
+       ++num;
+     }
+     grp(ctx, ptr, grpEnd);
+     ptr = grpEnd;
+   }
+ }
+ 
+ /*-*************************************
+ *  Cover functions
+ ***************************************/
+ 
+ /**
+  * Called on each group of positions with the same dmer.
+  * Counts the frequency of each dmer and saves it in the suffix array.
+  * Fills `ctx->dmerAt`.
+  *
+  * group / groupEnd : first entry and one-past-last entry of the group; both
+  * point to U32 positions stored inside `ctx->suffix`.
+  * The frequency is incremented only when a position lies at or beyond the
+  * end of the sample that was counted last, and is stored in the group's
+  * first suffix entry.
+  */
+ static void COVER_group(COVER_ctx_t *ctx, const void *group,
+                         const void *groupEnd) {
+   /* The group consists of all the positions with the same first d bytes. */
+   const U32 *grpPtr = (const U32 *)group;
+   const U32 *grpEnd = (const U32 *)groupEnd;
+   /* The dmerId is how we will reference this dmer.
+    * This allows us to map the whole dmer space to a much smaller space, the
+    * size of the suffix array.
+    */
+   const U32 dmerId = (U32)(grpPtr - ctx->suffix);
+   /* Count the number of samples this dmer shows up in */
+   U32 freq = 0;
+   /* Details */
+   const size_t *curOffsetPtr = ctx->offsets;
+   const size_t *offsetsEnd = ctx->offsets + ctx->nbSamples;
+   /* Once *grpPtr >= curSampleEnd this occurrence of the dmer is in a
+    * different sample than the last.
+    */
+   size_t curSampleEnd = ctx->offsets[0];
+   for (; grpPtr != grpEnd; ++grpPtr) {
+     /* Save the dmerId for this position so we can get back to it. */
+     ctx->dmerAt[*grpPtr] = dmerId;
+     /* Dictionaries only help for the first reference to the dmer.
+      * After that zstd can reference the match from the previous reference.
+      * So only count each dmer once for each sample it is in.
+      */
+     if (*grpPtr < curSampleEnd) {
+       continue;
+     }
+     freq += 1;
+     /* Binary search to find the end of the sample *grpPtr is in.
+      * In the common case that grpPtr + 1 == grpEnd we can skip the binary
+      * search because the loop is over.
+      */
+     if (grpPtr + 1 != grpEnd) {
+       const size_t *sampleEndPtr =
+           COVER_lower_bound(curOffsetPtr, offsetsEnd, *grpPtr);
+       curSampleEnd = *sampleEndPtr;
+       curOffsetPtr = sampleEndPtr + 1;   /* later searches start after the offset just found */
+     }
+   }
+   /* At this point we are never going to look at this segment of the suffix
+    * array again.  We take advantage of this fact to save memory.
+    * We store the frequency of the dmer in the first position of the group,
+    * which is dmerId.
+    */
+   ctx->suffix[dmerId] = freq;
+ }
+ 
+ 
+ /**
+  * Selects the best segment in an epoch.
+  * Segments are scored according to the function:
+  *
+  * Let F(d) be the frequency of dmer d.
+  * Let S_i be the dmer at position i of segment S which has length k.
+  *
+  *     Score(S) = F(S_1) + F(S_2) + ... + F(S_{k-d+1})
+  *
+  * Once the dmer d is in the dictionary we set F(d) = 0.
+  *
+  * ctx         : provides `dmerAt`, the dmerId found at each position.
+  * freqs       : frequency of each dmerId; the entries of the dmers covered
+  *               by the returned segment are set to 0 before returning.
+  * activeDmers : scratch map, cleared on entry; it must be able to hold the
+  *               dmers of one window (k - d + 1 positions).
+  * begin, end  : the epoch, as the position range [begin, end).
+  * parameters  : only `k` and `d` are read.
+  *
+  * Returns the highest-scoring window, with its zero-frequency head and tail
+  * trimmed off. If no window has a positive score, the returned segment has
+  * a score of 0.
+  */
+ static COVER_segment_t COVER_selectSegment(const COVER_ctx_t *ctx, U32 *freqs,
+                                            COVER_map_t *activeDmers, U32 begin,
+                                            U32 end,
+                                            ZDICT_cover_params_t parameters) {
+   /* Constants */
+   const U32 k = parameters.k;
+   const U32 d = parameters.d;
+   const U32 dmersInK = k - d + 1;
+   /* Try each segment (activeSegment) and save the best (bestSegment) */
+   COVER_segment_t bestSegment = {0, 0, 0};
+   COVER_segment_t activeSegment;
+   /* Reset the activeDmers in the segment */
+   COVER_map_clear(activeDmers);
+   /* The activeSegment starts at the beginning of the epoch. */
+   activeSegment.begin = begin;
+   activeSegment.end = begin;
+   activeSegment.score = 0;
+   /* Slide the activeSegment through the whole epoch.
+    * Save the best segment in bestSegment.
+    */
+   while (activeSegment.end < end) {
+     /* The dmerId for the dmer at the next position */
+     U32 newDmer = ctx->dmerAt[activeSegment.end];
+     /* The entry in activeDmers for this dmerId */
+     U32 *newDmerOcc = COVER_map_at(activeDmers, newDmer);
+     /* If the dmer isn't already present in the segment add its score. */
+     if (*newDmerOcc == 0) {
+       /* The paper suggests using the L-0.5 norm, but experiments show that it
+        * doesn't help.
+        */
+       activeSegment.score += freqs[newDmer];
+     }
+     /* Add the dmer to the segment */
+     activeSegment.end += 1;
+     *newDmerOcc += 1;
+ 
+     /* If the window is now too large, drop the first position */
+     if (activeSegment.end - activeSegment.begin == dmersInK + 1) {
+       U32 delDmer = ctx->dmerAt[activeSegment.begin];
+       U32 *delDmerOcc = COVER_map_at(activeDmers, delDmer);
+       activeSegment.begin += 1;
+       *delDmerOcc -= 1;
+       /* If this is the last occurrence of the dmer, subtract its score */
+       if (*delDmerOcc == 0) {
+         COVER_map_remove(activeDmers, delDmer);
+         activeSegment.score -= freqs[delDmer];
+       }
+     }
+ 
+     /* If this segment is the best so far save it */
+     if (activeSegment.score > bestSegment.score) {
+       bestSegment = activeSegment;
+     }
+   }
+   {
+     /* Trim off the zero frequency head and tail from the segment. */
+     U32 newBegin = bestSegment.end;
+     U32 newEnd = bestSegment.begin;
+     U32 pos;
+     for (pos = bestSegment.begin; pos != bestSegment.end; ++pos) {
+       U32 freq = freqs[ctx->dmerAt[pos]];
+       if (freq != 0) {
+         newBegin = MIN(newBegin, pos);
+         newEnd = pos + 1;
+       }
+     }
+     bestSegment.begin = newBegin;
+     bestSegment.end = newEnd;
+   }
+   {
+     /* Zero out the frequency of each dmer covered by the chosen segment. */
+     U32 pos;
+     for (pos = bestSegment.begin; pos != bestSegment.end; ++pos) {
+       freqs[ctx->dmerAt[pos]] = 0;
+     }
+   }
+   return bestSegment;
+ }
+ 
+ /**
+  * Validates a set of cover parameters against the maximum dictionary size.
+  * The parameters are accepted when k and d are both non-zero,
+  * d <= k <= maxDictSize, and splitPoint is not outside (0, 1].
+  * Returns 1 if the parameters are valid and 0 otherwise.
+  */
+ static int COVER_checkParameters(ZDICT_cover_params_t parameters,
+                                  size_t maxDictSize) {
+   /* k and d are required parameters */
+   int const hasKAndD = !(parameters.d == 0 || parameters.k == 0);
+   /* k <= maxDictSize */
+   int const kFitsDict = !(parameters.k > maxDictSize);
+   /* d <= k */
+   int const dFitsK = !(parameters.d > parameters.k);
+   /* 0 < splitPoint <= 1 */
+   int const splitInRange =
+       !(parameters.splitPoint <= 0 || parameters.splitPoint > 1);
+   return hasKAndD && kFitsDict && dFitsK && splitInRange;
+ }
+ 
+ /**
+  * Releases the buffers owned by a context initialized with
+  * `COVER_ctx_init()`: `suffix`, `freqs`, `dmerAt` and `offsets`.
+  * Each pointer is reset to NULL afterwards.  A NULL `ctx` is ignored.
+  */
+ static void COVER_ctx_destroy(COVER_ctx_t *ctx) {
+   if (ctx == NULL) {
+     return;
+   }
+   /* free(NULL) does nothing, so buffers that were never allocated are fine */
+   free(ctx->suffix);
+   ctx->suffix = NULL;
+   free(ctx->freqs);
+   ctx->freqs = NULL;
+   free(ctx->dmerAt);
+   ctx->dmerAt = NULL;
+   free(ctx->offsets);
+   ctx->offsets = NULL;
+ }
+ 
+ /**
+  * Prepare a context for dictionary building.
+  * The context is only dependent on the parameter `d` and can be used multiple
+  * times.
+  *
+  * The leading `splitPoint` fraction of the samples forms the training set and
+  * the remainder the testing set; when `splitPoint` is 1.0 every sample is
+  * used for both.  Initialization sorts the training positions by their first
+  * `d` bytes, groups equal dmers, records a dmer id per position in
+  * `ctx->dmerAt` and leaves the per-dmer frequencies in `ctx->freqs`.
+  *
+  * Fails when:
+  *   - the total input is smaller than one dmer or reaches
+  *     COVER_MAX_SAMPLES_SIZE,
+  *   - there are fewer than 5 training samples or no testing sample,
+  *   - the training set alone is smaller than one dmer,
+  *   - a scratch buffer cannot be allocated.
+  *
+  * Returns 1 on success or zero on error.
+  * On success the context must be destroyed with `COVER_ctx_destroy()`.
+  * On failure there is nothing left to release: the validation checks return
+  * before `ctx` is written, and the allocation-failure path cleans up itself.
+  */
+ static int COVER_ctx_init(COVER_ctx_t *ctx, const void *samplesBuffer,
+                           const size_t *samplesSizes, unsigned nbSamples,
+                           unsigned d, double splitPoint) {
+   const BYTE *const samples = (const BYTE *)samplesBuffer;
+   const size_t totalSamplesSize = COVER_sum(samplesSizes, nbSamples);
+   /* Smallest input that holds one dmer.  The floor of sizeof(U64) is
+    * presumably there because the d <= 8 comparators read 8 bytes at once
+    * -- TODO confirm against COVER_cmp8. */
+   const size_t minSamplesSize = MAX(d, sizeof(U64));
+   /* Split samples into testing and training sets */
+   const unsigned nbTrainSamples = splitPoint < 1.0 ? (unsigned)((double)nbSamples * splitPoint) : nbSamples;
+   const unsigned nbTestSamples = splitPoint < 1.0 ? nbSamples - nbTrainSamples : nbSamples;
+   const size_t trainingSamplesSize = splitPoint < 1.0 ? COVER_sum(samplesSizes, nbTrainSamples) : totalSamplesSize;
+   const size_t testSamplesSize = splitPoint < 1.0 ? COVER_sum(samplesSizes + nbTrainSamples, nbTestSamples) : totalSamplesSize;
+   /* Checks */
+   if (totalSamplesSize < minSamplesSize) {
+     DISPLAYLEVEL(1, "Total samples size is too small (%u bytes), minimum size is %u bytes\n",
+                  (unsigned)totalSamplesSize, (unsigned)minSamplesSize);
+     return 0;
+   }
+   if (totalSamplesSize >= (size_t)COVER_MAX_SAMPLES_SIZE) {
+     DISPLAYLEVEL(1, "Total samples size is too large (%u MB), maximum size is %u MB\n",
+                  (unsigned)(totalSamplesSize>>20), (COVER_MAX_SAMPLES_SIZE >> 20));
+     return 0;
+   }
+   /* Check if there are at least 5 training samples */
+   if (nbTrainSamples < 5) {
+     DISPLAYLEVEL(1, "Total number of training samples is %u and is invalid.", nbTrainSamples);
+     return 0;
+   }
+   /* Check if there's testing sample */
+   if (nbTestSamples < 1) {
+     DISPLAYLEVEL(1, "Total number of testing samples is %u and is invalid.", nbTestSamples);
+     return 0;
+   }
+   /* The suffix array covers only the training set, so that set on its own
+    * must hold at least one dmer.  Without this check the suffixSize
+    * computation below would wrap around to a huge value. */
+   if (trainingSamplesSize < minSamplesSize) {
+     DISPLAYLEVEL(1, "Training samples size is too small (%u bytes), minimum size is %u bytes\n",
+                  (unsigned)trainingSamplesSize, (unsigned)minSamplesSize);
+     return 0;
+   }
+   /* Zero the context */
+   memset(ctx, 0, sizeof(*ctx));
+   DISPLAYLEVEL(2, "Training on %u samples of total size %u\n", nbTrainSamples,
+                (unsigned)trainingSamplesSize);
+   DISPLAYLEVEL(2, "Testing on %u samples of total size %u\n", nbTestSamples,
+                (unsigned)testSamplesSize);
+   ctx->samples = samples;
+   ctx->samplesSizes = samplesSizes;
+   ctx->nbSamples = nbSamples;
+   ctx->nbTrainSamples = nbTrainSamples;
+   ctx->nbTestSamples = nbTestSamples;
+   /* Partial suffix array */
+   ctx->suffixSize = trainingSamplesSize - minSamplesSize + 1;
+   ctx->suffix = (U32 *)malloc(ctx->suffixSize * sizeof(U32));
+   /* Maps index to the dmerID */
+   ctx->dmerAt = (U32 *)malloc(ctx->suffixSize * sizeof(U32));
+   /* The offsets of each file */
+   ctx->offsets = (size_t *)malloc((nbSamples + 1) * sizeof(size_t));
+   if (!ctx->suffix || !ctx->dmerAt || !ctx->offsets) {
+     DISPLAYLEVEL(1, "Failed to allocate scratch buffers\n");
+     COVER_ctx_destroy(ctx);
+     return 0;
+   }
+   ctx->freqs = NULL;
+   ctx->d = d;
+ 
+   /* Fill offsets from the samplesSizes */
+   {
+     U32 i;
+     ctx->offsets[0] = 0;
+     for (i = 1; i <= nbSamples; ++i) {
+       ctx->offsets[i] = ctx->offsets[i - 1] + samplesSizes[i - 1];
+     }
+   }
+   DISPLAYLEVEL(2, "Constructing partial suffix array\n");
+   {
+     /* suffix is a partial suffix array.
+      * It only sorts suffixes by their first parameters.d bytes.
+      * The sort is stable, so each dmer group is sorted by position in input.
+      */
+     U32 i;
+     for (i = 0; i < ctx->suffixSize; ++i) {
+       ctx->suffix[i] = i;
+     }
+     /* qsort doesn't take an opaque pointer, so pass as a global.
+      * On OpenBSD qsort() is not guaranteed to be stable, their mergesort() is.
+      */
+     g_ctx = ctx;
+ #if defined(__OpenBSD__)
+     mergesort(ctx->suffix, ctx->suffixSize, sizeof(U32),
+           (ctx->d <= 8 ? &COVER_strict_cmp8 : &COVER_strict_cmp));
+ #else
+     qsort(ctx->suffix, ctx->suffixSize, sizeof(U32),
+           (ctx->d <= 8 ? &COVER_strict_cmp8 : &COVER_strict_cmp));
+ #endif
+   }
+   DISPLAYLEVEL(2, "Computing frequencies\n");
+   /* For each dmer group (group of positions with the same first d bytes):
+    * 1. For each position we set dmerAt[position] = dmerID.  The dmerID is
+    *    (groupBeginPtr - suffix).  This allows us to go from position to
+    *    dmerID so we can look up values in freq.
+    * 2. We calculate how many samples the dmer occurs in and save it in
+    *    freqs[dmerId].
+    */
+   COVER_groupBy(ctx->suffix, ctx->suffixSize, sizeof(U32), ctx,
+                 (ctx->d <= 8 ? &COVER_cmp8 : &COVER_cmp), &COVER_group);
+   /* The suffix buffer is handed over to freqs rather than copied. */
+   ctx->freqs = ctx->suffix;
+   ctx->suffix = NULL;
+   return 1;
+ }
+ 
+ /**
+  * Fill `dictBuffer` with segments selected from the prepared context.
+  *
+  * The training positions are divided into equally sized epochs that are
+  * visited round-robin; one segment is selected per visit and written in
+  * front of the previously written ones, so the buffer fills from its end
+  * towards its start.  `freqs` and `activeDmers` are scratch state handed to
+  * `COVER_selectSegment()`.
+  *
+  * Returns the offset in `dictBuffer` at which the written content begins
+  * (equal to `dictBufferCapacity` when nothing was written).
+  */
+ static size_t COVER_buildDictionary(const COVER_ctx_t *ctx, U32 *freqs,
+                                     COVER_map_t *activeDmers, void *dictBuffer,
+                                     size_t dictBufferCapacity,
+                                     ZDICT_cover_params_t parameters) {
+   BYTE *const out = (BYTE *)dictBuffer;
+   /* Equal-size epochs; at least one segment is taken from each of them. */
+   const unsigned epochs = MAX(1, (U32)(dictBufferCapacity / parameters.k / 4));
+   const unsigned epochSize = (U32)(ctx->suffixSize / epochs);
+   size_t remaining = dictBufferCapacity;
+   size_t epoch = 0;
+   DISPLAYLEVEL(2, "Breaking content into %u epochs of size %u\n",
+                 epochs, epochSize);
+   /* Keep cycling through the epochs until the buffer is full or no useful
+    * segment is left.
+    */
+   while (remaining > 0) {
+     const U32 epochBegin = (U32)(epoch * epochSize);
+     const U32 epochEnd = epochBegin + epochSize;
+     const COVER_segment_t segment = COVER_selectSegment(
+         ctx, freqs, activeDmers, epochBegin, epochEnd, parameters);
+     size_t segmentSize;
+     /* A zero score means the segment covers no dmers: content is exhausted */
+     if (segment.score == 0) {
+       break;
+     }
+     /* Clamp to the space that is left; stop when less than one dmer fits */
+     segmentSize = MIN(segment.end - segment.begin + parameters.d - 1, remaining);
+     if (segmentSize < parameters.d) {
+       break;
+     }
+     /* Writing back-to-front lets the best segments be referenced with the
+      * smallest offsets.
+      */
+     remaining -= segmentSize;
+     memcpy(out + remaining, ctx->samples + segment.begin, segmentSize);
+     DISPLAYUPDATE(
+         2, "\r%u%%       ",
+         (unsigned)(((dictBufferCapacity - remaining) * 100) / dictBufferCapacity));
+     epoch = (epoch + 1) % epochs;
+   }
+   DISPLAYLEVEL(2, "\r%79s\r", "");
+   return remaining;
+ }
+ 
+ /**
+  * Train a dictionary with the COVER algorithm using exactly the supplied
+  * `parameters` (no parameter search is performed).
+  *
+  * `splitPoint` is forced to 1.0, so every sample is used for training.
+  * The dictionary is written into `dictBuffer`.
+  *
+  * Returns the value produced by `ZDICT_finalizeDictionary()` (the dictionary
+  * size, or an error code), ERROR(dstSize_tooSmall) when `dictBufferCapacity`
+  * is below ZDICT_DICTSIZE_MIN, or ERROR(GENERIC) for invalid parameters, an
+  * empty sample set, or a failed initialization.
+  */
+ ZDICTLIB_API size_t ZDICT_trainFromBuffer_cover(
+     void *dictBuffer, size_t dictBufferCapacity,
+     const void *samplesBuffer, const size_t *samplesSizes, unsigned nbSamples,
+     ZDICT_cover_params_t parameters)
+ {
+   BYTE* const dictStart = (BYTE*)dictBuffer;
+   COVER_ctx_t ctx;
+   COVER_map_t activeDmers;
+   size_t contentOffset;
+   size_t dictionarySize;
+   parameters.splitPoint = 1.0;
+   /* The display macros read this global */
+   g_displayLevel = parameters.zParams.notificationLevel;
+   /* Argument validation */
+   if (!COVER_checkParameters(parameters, dictBufferCapacity)) {
+     DISPLAYLEVEL(1, "Cover parameters incorrect\n");
+     return ERROR(GENERIC);
+   }
+   if (nbSamples == 0) {
+     DISPLAYLEVEL(1, "Cover must have at least one input file\n");
+     return ERROR(GENERIC);
+   }
+   if (dictBufferCapacity < ZDICT_DICTSIZE_MIN) {
+     DISPLAYLEVEL(1, "dictBufferCapacity must be at least %u\n",
+                  ZDICT_DICTSIZE_MIN);
+     return ERROR(dstSize_tooSmall);
+   }
+   /* Set up the context, then the map of active dmers */
+   if (!COVER_ctx_init(&ctx, samplesBuffer, samplesSizes, nbSamples,
+                       parameters.d, parameters.splitPoint)) {
+     return ERROR(GENERIC);
+   }
+   if (!COVER_map_init(&activeDmers, parameters.k - parameters.d + 1)) {
+     DISPLAYLEVEL(1, "Failed to allocate dmer map: out of memory\n");
+     COVER_ctx_destroy(&ctx);
+     return ERROR(GENERIC);
+   }
+ 
+   DISPLAYLEVEL(2, "Building dictionary\n");
+   /* Select the raw content, then let ZDICT turn it into a full dictionary */
+   contentOffset =
+       COVER_buildDictionary(&ctx, ctx.freqs, &activeDmers, dictBuffer,
+                             dictBufferCapacity, parameters);
+   dictionarySize = ZDICT_finalizeDictionary(
+       dictStart, dictBufferCapacity, dictStart + contentOffset,
+       dictBufferCapacity - contentOffset, samplesBuffer, samplesSizes,
+       nbSamples, parameters.zParams);
+   if (!ZSTD_isError(dictionarySize)) {
+     DISPLAYLEVEL(2, "Constructed dictionary of size %u\n",
+                  (unsigned)dictionarySize);
+   }
+   COVER_ctx_destroy(&ctx);
+   COVER_map_destroy(&activeDmers);
+   return dictionarySize;
+ }
+ 
+ 
+ 
+ /**
+  * Measure how well `dict` compresses the evaluation samples.
+  *
+  * The evaluation samples are those from index `nbTrainSamples` onwards when
+  * `parameters.splitPoint` is below 1.0, and all `nbSamples` samples
+  * otherwise.  Sample `i` is read from `samples + offsets[i]` with length
+  * `samplesSizes[i]`.
+  *
+  * Returns `dictBufferCapacity` plus the sum of the compressed sample sizes,
+  * or ERROR(GENERIC) when an allocation or any compression fails.
+  */
+ size_t COVER_checkTotalCompressedSize(const ZDICT_cover_params_t parameters,
+                                     const size_t *samplesSizes, const BYTE *samples,
+                                     size_t *offsets,
+                                     size_t nbTrainSamples, size_t nbSamples,
+                                     BYTE *const dict, size_t dictBufferCapacity) {
+   /* Index of the first sample that takes part in the evaluation */
+   const size_t firstSample = parameters.splitPoint < 1.0 ? nbTrainSamples : 0;
+   size_t totalCompressedSize = ERROR(GENERIC);
+   size_t maxSampleSize = 0;
+   size_t dstCapacity;
+   size_t idx;
+   void *dst;
+   ZSTD_CCtx *cctx;
+   ZSTD_CDict *cdict;
+   /* Size one scratch buffer for the largest sample to be compressed */
+   for (idx = firstSample; idx < nbSamples; ++idx) {
+     maxSampleSize = MAX(samplesSizes[idx], maxSampleSize);
+   }
+   dstCapacity = ZSTD_compressBound(maxSampleSize);
+   dst = malloc(dstCapacity);
+   /* Compression context and digested dictionary */
+   cctx = ZSTD_createCCtx();
+   cdict = ZSTD_createCDict(dict, dictBufferCapacity,
+                            parameters.zParams.compressionLevel);
+   if (dst && cctx && cdict) {
+     /* The dictionary itself counts towards the total */
+     totalCompressedSize = dictBufferCapacity;
+     for (idx = firstSample; idx < nbSamples; ++idx) {
+       const size_t size = ZSTD_compress_usingCDict(
+           cctx, dst, dstCapacity, samples + offsets[idx],
+           samplesSizes[idx], cdict);
+       if (ZSTD_isError(size)) {
+         totalCompressedSize = ERROR(GENERIC);
+         break;
+       }
+       totalCompressedSize += size;
+     }
+   }
+   ZSTD_freeCCtx(cctx);
+   ZSTD_freeCDict(cdict);
+   free(dst);
+   return totalCompressedSize;
+ }
+ 
+ 
+ /**
+  * Put a `COVER_best_t` into its initial state: mutex and condition variable
+  * initialized, no live jobs, no stored dictionary, zeroed parameters, and the
+  * largest possible `compressedSize` so that any real result compares lower.
+  * A NULL `best` is accepted and ignored.
+  */
+ void COVER_best_init(COVER_best_t *best) {
+   if (best != NULL) {
+     (void)ZSTD_pthread_mutex_init(&best->mutex, NULL);
+     (void)ZSTD_pthread_cond_init(&best->cond, NULL);
+     memset(&best->parameters, 0, sizeof(best->parameters));
+     best->compressedSize = (size_t)-1;
+     best->dictSize = 0;
+     best->dict = NULL;
+     best->liveJobs = 0;
+   }
+ }
+ 
+ /**
+  * Block the caller until no job is live any more (liveJobs == 0).
+  * A NULL `best` is accepted and ignored.
+  */
+ void COVER_best_wait(COVER_best_t *best) {
+   if (best != NULL) {
+     ZSTD_pthread_mutex_lock(&best->mutex);
+     /* Re-test the counter after every wake-up */
+     while (best->liveJobs > 0) {
+       ZSTD_pthread_cond_wait(&best->cond, &best->mutex);
+     }
+     ZSTD_pthread_mutex_unlock(&best->mutex);
+   }
+ }
+ 
+ /**
+  * Wait for all live jobs via COVER_best_wait(), then release the stored
+  * dictionary and destroy the mutex and condition variable.
+  * A NULL `best` is accepted and ignored.
+  */
+ void COVER_best_destroy(COVER_best_t *best) {
+   if (best == NULL) {
+     return;
+   }
+   COVER_best_wait(best);
+   /* free(NULL) is a no-op, so an empty slot needs no special case */
+   free(best->dict);
+   ZSTD_pthread_mutex_destroy(&best->mutex);
+   ZSTD_pthread_cond_destroy(&best->cond);
+ }
+ 
+ /**
+  * Register one more job: called right before a job is launched.
+  * Increments liveJobs under the mutex.  A NULL `best` is accepted and ignored.
+  */
+ void COVER_best_start(COVER_best_t *best) {
+   if (best != NULL) {
+     ZSTD_pthread_mutex_lock(&best->mutex);
+     best->liveJobs += 1;
+     ZSTD_pthread_mutex_unlock(&best->mutex);
+   }
+ }
+ 
+ /**
+  * Report the end of a job, whether it succeeded or failed.
+  *
+  * Decrements liveJobs and, when it reaches zero, wakes every thread blocked
+  * on the condition variable.  When `compressedSize` is lower than the best
+  * value recorded so far, a private copy of `dict` (`dictSize` bytes) is
+  * stored together with `parameters` and `compressedSize`.
+  *
+  * If the buffer for that copy cannot be allocated, the record is set to
+  * ERROR(GENERIC) with an empty dictionary and the function returns early.
+  * A NULL `best` is accepted and ignored.
+  */
+ void COVER_best_finish(COVER_best_t *best, size_t compressedSize,
+                        ZDICT_cover_params_t parameters, void *dict,
+                        size_t dictSize) {
+   size_t remainingJobs;
+   if (best == NULL) {
+     return;
+   }
+   ZSTD_pthread_mutex_lock(&best->mutex);
+   best->liveJobs -= 1;
+   remainingJobs = best->liveJobs;
+   /* Only a strictly smaller result replaces the stored one */
+   if (compressedSize < best->compressedSize) {
+     const int needsNewBuffer =
+         (best->dict == NULL) || (best->dictSize < dictSize);
+     if (needsNewBuffer) {
+       /* free(NULL) is a no-op, so the old buffer needs no NULL test */
+       free(best->dict);
+       best->dict = malloc(dictSize);
+       if (best->dict == NULL) {
+         best->compressedSize = ERROR(GENERIC);
+         best->dictSize = 0;
+         ZSTD_pthread_cond_signal(&best->cond);
+         ZSTD_pthread_mutex_unlock(&best->mutex);
+         return;
+       }
+     }
+     /* Record the dictionary bytes, their size, and how they were obtained */
+     memcpy(best->dict, dict, dictSize);
+     best->dictSize = dictSize;
+     best->parameters = parameters;
+     best->compressedSize = compressedSize;
+   }
+   if (remainingJobs == 0) {
+     ZSTD_pthread_cond_broadcast(&best->cond);
+   }
+   ZSTD_pthread_mutex_unlock(&best->mutex);
+ }
+ 
+ /**
+  * Parameters for COVER_tryParameters().
+  * One instance is heap-allocated per (d, k) combination and handed to
+  * COVER_tryParameters(), which frees it.
+  */
+ typedef struct COVER_tryParameters_data_s {
+   const COVER_ctx_t *ctx;          /* prepared context for the current d; only read */
+   COVER_best_t *best;              /* shared record that receives the result */
+   size_t dictBufferCapacity;       /* size of the dictionary buffer to build into */
+   ZDICT_cover_params_t parameters; /* the parameter set to evaluate */
+ } COVER_tryParameters_data_t;
+ 
+ /**
+  * Tries a set of parameters and updates the COVER_best_t with the results.
+  * This function is thread safe if zstd is compiled with multithreaded support.
+  * It takes its parameters as an *OWNING* opaque pointer to support threading.
+  *
+  * `opaque` must point to a heap-allocated COVER_tryParameters_data_t; it is
+  * freed here on every path.  COVER_best_finish() is likewise called on every
+  * path, with ERROR(GENERIC) as the compressed size when any step failed.
+  */
+ static void COVER_tryParameters(void *opaque) {
+   /* Save parameters as local variables */
+   COVER_tryParameters_data_t *const data = (COVER_tryParameters_data_t *)opaque;
+   const COVER_ctx_t *const ctx = data->ctx;
+   const ZDICT_cover_params_t parameters = data->parameters;
+   size_t dictBufferCapacity = data->dictBufferCapacity;
+   /* Stays an error value unless the whole pipeline below succeeds */
+   size_t totalCompressedSize = ERROR(GENERIC);
+   /* Allocate space for hash table, dict, and freqs */
+   COVER_map_t activeDmers;
+   BYTE *const dict = (BYTE * const)malloc(dictBufferCapacity);
+   U32 *freqs = (U32 *)malloc(ctx->suffixSize * sizeof(U32));
+   if (!COVER_map_init(&activeDmers, parameters.k - parameters.d + 1)) {
+     DISPLAYLEVEL(1, "Failed to allocate dmer map: out of memory\n");
+     goto _cleanup;
+   }
+   if (!dict || !freqs) {
+     DISPLAYLEVEL(1, "Failed to allocate buffers: out of memory\n");
+     goto _cleanup;
+   }
+   /* Copy the frequencies because we need to modify them */
+   memcpy(freqs, ctx->freqs, ctx->suffixSize * sizeof(U32));
+   /* Build the dictionary */
+   {
+     const size_t tail = COVER_buildDictionary(ctx, freqs, &activeDmers, dict,
+                                               dictBufferCapacity, parameters);
+     /* From here on dictBufferCapacity holds the finalized dictionary size
+      * (or an error code), no longer the buffer capacity. */
+     dictBufferCapacity = ZDICT_finalizeDictionary(
+         dict, dictBufferCapacity, dict + tail, dictBufferCapacity - tail,
+         ctx->samples, ctx->samplesSizes, (unsigned)ctx->nbTrainSamples,
+         parameters.zParams);
+     if (ZDICT_isError(dictBufferCapacity)) {
+       DISPLAYLEVEL(1, "Failed to finalize dictionary\n");
+       goto _cleanup;
+     }
+   }
+   /* Check total compressed size */
+   totalCompressedSize = COVER_checkTotalCompressedSize(parameters, ctx->samplesSizes,
+                                                        ctx->samples, ctx->offsets,
+                                                        ctx->nbTrainSamples, ctx->nbSamples,
+                                                        dict, dictBufferCapacity);
+ 
+ _cleanup:
+   /* Report before freeing: COVER_best_finish() reads data->best and copies
+    * from dict when this result is the best so far. */
+   COVER_best_finish(data->best, totalCompressedSize, parameters, dict,
+                     dictBufferCapacity);
+   free(data);
+   COVER_map_destroy(&activeDmers);
+   if (dict) {
+     free(dict);
+   }
+   if (freqs) {
+     free(freqs);
+   }
+ }
+ 
+ /**
+  * Search for good COVER parameters and train a dictionary with the best set.
+  *
+  * Every `d` in [kMinD, kMaxD] (step 2) is combined with every `k` in
+  * [kMinK, kMaxK] (step kStepSize).  A non-zero `parameters->d` or
+  * `parameters->k` pins that value; zero selects the defaults d = 6..8 and
+  * k = 50..2000.  `parameters->steps == 0` selects 40 steps, and a
+  * `parameters->splitPoint <= 0` selects DEFAULT_SPLITPOINT.  Each combination
+  * is evaluated by COVER_tryParameters(), on a thread pool when
+  * `parameters->nbThreads > 1` and inline otherwise.
+  *
+  * On success the best dictionary is copied into `dictBuffer`, `*parameters`
+  * is overwritten with the winning parameter set, and the dictionary size is
+  * returned.  On failure an error code is returned.
+  *
+  * All diagnostics emitted before the global display level is set for this
+  * call go through LOCALDISPLAYLEVEL, so they follow the caller's
+  * notificationLevel rather than a value left behind by an earlier call.
+  */
+ ZDICTLIB_API size_t ZDICT_optimizeTrainFromBuffer_cover(
+     void *dictBuffer, size_t dictBufferCapacity, const void *samplesBuffer,
+     const size_t *samplesSizes, unsigned nbSamples,
+     ZDICT_cover_params_t *parameters) {
+   /* constants */
+   const unsigned nbThreads = parameters->nbThreads;
+   const double splitPoint =
+       parameters->splitPoint <= 0.0 ? DEFAULT_SPLITPOINT : parameters->splitPoint;
+   const unsigned kMinD = parameters->d == 0 ? 6 : parameters->d;
+   const unsigned kMaxD = parameters->d == 0 ? 8 : parameters->d;
+   const unsigned kMinK = parameters->k == 0 ? 50 : parameters->k;
+   const unsigned kMaxK = parameters->k == 0 ? 2000 : parameters->k;
+   const unsigned kSteps = parameters->steps == 0 ? 40 : parameters->steps;
+   const unsigned kStepSize = MAX((kMaxK - kMinK) / kSteps, 1);
+   /* Number of (d, k) pairs visited; used only for progress reporting */
+   const unsigned kIterations =
+       (1 + (kMaxD - kMinD) / 2) * (1 + (kMaxK - kMinK) / kStepSize);
+   /* Local variables */
+   const int displayLevel = parameters->zParams.notificationLevel;
+   unsigned iteration = 1;
+   unsigned d;
+   unsigned k;
+   COVER_best_t best;
+   POOL_ctx *pool = NULL;
+ 
+   /* Checks */
+   if (splitPoint <= 0 || splitPoint > 1) {
+     LOCALDISPLAYLEVEL(displayLevel, 1, "Incorrect parameters\n");
+     return ERROR(GENERIC);
+   }
+   if (kMinK < kMaxD || kMaxK < kMinK) {
+     LOCALDISPLAYLEVEL(displayLevel, 1, "Incorrect parameters\n");
+     return ERROR(GENERIC);
+   }
+   if (nbSamples == 0) {
+     LOCALDISPLAYLEVEL(displayLevel, 1, "Cover must have at least one input file\n");
+     return ERROR(GENERIC);
+   }
+   if (dictBufferCapacity < ZDICT_DICTSIZE_MIN) {
+     LOCALDISPLAYLEVEL(displayLevel, 1, "dictBufferCapacity must be at least %u\n",
+                       ZDICT_DICTSIZE_MIN);
+     return ERROR(dstSize_tooSmall);
+   }
+   if (nbThreads > 1) {
+     pool = POOL_create(nbThreads, 1);
+     if (!pool) {
+       return ERROR(memory_allocation);
+     }
+   }
+   /* Initialization */
+   COVER_best_init(&best);
+   /* Turn down global display level to clean up display at level 2 and below */
+   g_displayLevel = displayLevel == 0 ? 0 : displayLevel - 1;
+   /* Loop through d first because each new value needs a new context */
+   LOCALDISPLAYLEVEL(displayLevel, 2, "Trying %u different sets of parameters\n",
+                     kIterations);
+   for (d = kMinD; d <= kMaxD; d += 2) {
+     /* Initialize the context for this value of d */
+     COVER_ctx_t ctx;
+     LOCALDISPLAYLEVEL(displayLevel, 3, "d=%u\n", d);
+     if (!COVER_ctx_init(&ctx, samplesBuffer, samplesSizes, nbSamples, d, splitPoint)) {
+       LOCALDISPLAYLEVEL(displayLevel, 1, "Failed to initialize context\n");
+       COVER_best_destroy(&best);
+       POOL_free(pool);
+       return ERROR(GENERIC);
+     }
+     /* Loop through k reusing the same context */
+     for (k = kMinK; k <= kMaxK; k += kStepSize) {
+       /* Prepare the arguments */
+       COVER_tryParameters_data_t *data = (COVER_tryParameters_data_t *)malloc(
+           sizeof(COVER_tryParameters_data_t));
+       LOCALDISPLAYLEVEL(displayLevel, 3, "k=%u\n", k);
+       if (!data) {
+         LOCALDISPLAYLEVEL(displayLevel, 1, "Failed to allocate parameters\n");
+         /* COVER_best_destroy() waits for the live jobs, which still read
+          * ctx, so it must run before the context is destroyed. */
+         COVER_best_destroy(&best);
+         COVER_ctx_destroy(&ctx);
+         POOL_free(pool);
+         return ERROR(GENERIC);
+       }
+       data->ctx = &ctx;
+       data->best = &best;
+       data->dictBufferCapacity = dictBufferCapacity;
+       data->parameters = *parameters;
+       data->parameters.k = k;
+       data->parameters.d = d;
+       data->parameters.splitPoint = splitPoint;
+       data->parameters.steps = kSteps;
+       data->parameters.zParams.notificationLevel = g_displayLevel;
+       /* Check the parameters */
+       if (!COVER_checkParameters(data->parameters, dictBufferCapacity)) {
+         DISPLAYLEVEL(1, "Cover parameters incorrect\n");
+         free(data);
+         continue;
+       }
+       /* Call the function and pass ownership of data to it */
+       COVER_best_start(&best);
+       if (pool) {
+         POOL_add(pool, &COVER_tryParameters, data);
+       } else {
+         COVER_tryParameters(data);
+       }
+       /* Print status */
+       LOCALDISPLAYUPDATE(displayLevel, 2, "\r%u%%       ",
+                          (unsigned)((iteration * 100) / kIterations));
+       ++iteration;
+     }
+     /* Every job for this d must finish before its context goes away */
+     COVER_best_wait(&best);
+     COVER_ctx_destroy(&ctx);
+   }
+   LOCALDISPLAYLEVEL(displayLevel, 2, "\r%79s\r", "");
+   /* Fill the output buffer and parameters with output of the best parameters */
+   {
+     const size_t dictSize = best.dictSize;
+     if (ZSTD_isError(best.compressedSize)) {
+       const size_t compressedSize = best.compressedSize;
+       COVER_best_destroy(&best);
+       POOL_free(pool);
+       return compressedSize;
+     }
+     *parameters = best.parameters;
+     memcpy(dictBuffer, best.dict, dictSize);
+     COVER_best_destroy(&best);
+     POOL_free(pool);
+     return dictSize;
+   }
+ }
--- a/vendor/github.com/DataDog/zstd/cover.h 0 → 100644
查看文件 @4f5343b
+++ b/vendor/github.com/DataDog/zstd/cover.h 0 → 100644
查看文件 @4f5343b
+ #include <stdio.h>  /* fprintf */
+ #include <stdlib.h> /* malloc, free, qsort */
+ #include <string.h> /* memset */
+ #include <time.h>   /* clock */
+ #include "mem.h" /* read */
+ #include "pool.h"
+ #include "threading.h"
+ #include "zstd_internal.h" /* includes zstd.h */
+ #ifndef ZDICT_STATIC_LINKING_ONLY
+ #define ZDICT_STATIC_LINKING_ONLY
+ #endif
+ #include "zdict.h"
+ 
+ /**
+  * COVER_best_t is used for two purposes:
+  * 1. Synchronizing threads.
+  * 2. Saving the best parameters and dictionary.
+  *
+  * All of the methods except COVER_best_init() are thread safe if zstd is
+  * compiled with multithreaded support.
+  */
+ typedef struct COVER_best_s {
+   ZSTD_pthread_mutex_t mutex;      /* guards every field below */
+   ZSTD_pthread_cond_t cond;        /* signalled when liveJobs drops to 0 */
+   size_t liveJobs;                 /* jobs started but not yet finished */
+   void *dict;                      /* malloc'd copy of the best dictionary, or NULL */
+   size_t dictSize;                 /* number of valid bytes in dict */
+   ZDICT_cover_params_t parameters; /* parameters that produced dict */
+   size_t compressedSize;           /* score of dict, lower is better; starts at (size_t)-1 */
+ } COVER_best_t;
+ 
+ /**
+  * A segment is a range in the source as well as the score of the segment.
+  * A score of 0 is treated by the dictionary builder as "covers no dmers".
+  */
+ typedef struct {
+   U32 begin; /* start of the range, as an offset into the samples */
+   U32 end;   /* end of the range; the bytes copied are end - begin + d - 1 */
+   U32 score; /* score assigned to the range by the selection step */
+ } COVER_segment_t;
+ 
+ /**
+  *  Checks total compressed size of a dictionary
+  *
+  *  Compresses the evaluation samples with `dict` and returns
+  *  `dictBufferCapacity` plus the sum of their compressed sizes, or an error
+  *  code on failure.  The evaluation samples start at index `nbTrainSamples`
+  *  when `parameters.splitPoint` is below 1.0, and at index 0 otherwise.
+  *  Sample `i` is located at `samples + offsets[i]` and is `samplesSizes[i]`
+  *  bytes long.
+  */
+ size_t COVER_checkTotalCompressedSize(const ZDICT_cover_params_t parameters,
+                                       const size_t *samplesSizes, const BYTE *samples,
+                                       size_t *offsets,
+                                       size_t nbTrainSamples, size_t nbSamples,
+                                       BYTE *const dict, size_t dictBufferCapacity);
+ 
+ /**
+  * Returns the sum of the sample sizes.
+  */
+ size_t COVER_sum(const size_t *samplesSizes, unsigned nbSamples) ;
+ 
+ /**
+  * Initialize the `COVER_best_t`.
+  * A NULL pointer is accepted and ignored.
+  */
+ void COVER_best_init(COVER_best_t *best);
+ 
+ /**
+  * Wait until liveJobs == 0.
+  * A NULL pointer is accepted and ignored.
+  */
+ void COVER_best_wait(COVER_best_t *best);
+ 
+ /**
+  * Call COVER_best_wait() and then destroy the COVER_best_t.
+  * Also frees the stored dictionary.  A NULL pointer is accepted and ignored.
+  */
+ void COVER_best_destroy(COVER_best_t *best);
+ 
+ /**
+  * Called when a thread is about to be launched.
+  * Increments liveJobs.
+  */
+ void COVER_best_start(COVER_best_t *best);
+ 
+ /**
+  * Called when a thread finishes executing, both on error or success.
+  * Decrements liveJobs and signals any waiting threads if liveJobs == 0.
+  * If this dictionary is the best so far save it and its parameters.
+  * The dictionary is copied, so the caller keeps ownership of `dict`.
+  */
+ void COVER_best_finish(COVER_best_t *best, size_t compressedSize,
+                        ZDICT_cover_params_t parameters, void *dict,
+                        size_t dictSize);
--- a/vendor/github.com/DataDog/zstd/cpu.h 0 → 100644
查看文件 @4f5343b
+++ b/vendor/github.com/DataDog/zstd/cpu.h 0 → 100644
查看文件 @4f5343b
+ /*
+  * Copyright (c) 2018-present, Facebook, Inc.
+  * All rights reserved.
+  *
+  * This source code is licensed under both the BSD-style license (found in the
+  * LICENSE file in the root directory of this source tree) and the GPLv2 (found
+  * in the COPYING file in the root directory of this source tree).
+  * You may select, at your option, one of the above-listed licenses.
+  */
+ 
+ #ifndef ZSTD_COMMON_CPU_H
+ #define ZSTD_COMMON_CPU_H
+ 
+ /**
+  * Implementation taken from folly/CpuId.h
+  * https://github.com/facebook/folly/blob/master/folly/CpuId.h
+  */
+ 
+ #include <string.h>
+ 
+ #include "mem.h"
+ 
+ #ifdef _MSC_VER
+ #include <intrin.h>
+ #endif
+ 
+ /* Raw feature words captured by ZSTD_cpuid(); all zero when cpuid is not
+  * queried on the target. */
+ typedef struct {
+     U32 f1c; /* cpuid leaf 1, ECX */
+     U32 f1d; /* cpuid leaf 1, EDX */
+     U32 f7b; /* cpuid leaf 7 (sub-leaf 0), EBX */
+     U32 f7c; /* cpuid leaf 7 (sub-leaf 0), ECX */
+ } ZSTD_cpuid_t;
+ 
+ /* Query the processor with the cpuid instruction and return the feature
+  * words of leaf 1 (ECX, EDX) and leaf 7 sub-leaf 0 (EBX, ECX).
+  * Leaf 0 is read first to learn the highest supported leaf `n`; a leaf is
+  * only queried when `n` is large enough, otherwise its words stay 0.
+  * On targets matched by none of the preprocessor branches below, no query is
+  * made and every word is 0. */
+ MEM_STATIC ZSTD_cpuid_t ZSTD_cpuid(void) {
+     U32 f1c = 0;
+     U32 f1d = 0;
+     U32 f7b = 0;
+     U32 f7c = 0;
+ #if defined(_MSC_VER) && (defined(_M_X64) || defined(_M_IX86))
+     /* MSVC: use the compiler intrinsics; reg[] receives EAX, EBX, ECX, EDX */
+     int reg[4];
+     __cpuid((int*)reg, 0);
+     {
+         int const n = reg[0];
+         if (n >= 1) {
+             __cpuid((int*)reg, 1);
+             f1c = (U32)reg[2];
+             f1d = (U32)reg[3];
+         }
+         if (n >= 7) {
+             __cpuidex((int*)reg, 7, 0);
+             f7b = (U32)reg[1];
+             f7c = (U32)reg[2];
+         }
+     }
+ #elif defined(__i386__) && defined(__PIC__) && !defined(__clang__) && defined(__GNUC__)
+     /* The following block like the normal cpuid branch below, but gcc
+      * reserves ebx for use of its pic register so we must specially
+      * handle the save and restore to avoid clobbering the register
+      */
+     U32 n;
+     __asm__(
+         "pushl %%ebx\n\t"
+         "cpuid\n\t"
+         "popl %%ebx\n\t"
+         : "=a"(n)
+         : "a"(0)
+         : "ecx", "edx");
+     if (n >= 1) {
+       U32 f1a;
+       __asm__(
+           "pushl %%ebx\n\t"
+           "cpuid\n\t"
+           "popl %%ebx\n\t"
+           : "=a"(f1a), "=c"(f1c), "=d"(f1d)
+           : "a"(1));
+     }
+     if (n >= 7) {
+       /* EBX cannot be an output here, so its value is moved into EAX
+        * before the saved EBX is restored. */
+       __asm__(
+           "pushl %%ebx\n\t"
+           "cpuid\n\t"
+           "movl %%ebx, %%eax\n\t"
+           "popl %%ebx"
+           : "=a"(f7b), "=c"(f7c)
+           : "a"(7), "c"(0)
+           : "edx");
+     }
+ #elif defined(__x86_64__) || defined(_M_X64) || defined(__i386__)
+     /* Generic GCC-style inline asm; EBX may be used directly */
+     U32 n;
+     __asm__("cpuid" : "=a"(n) : "a"(0) : "ebx", "ecx", "edx");
+     if (n >= 1) {
+       U32 f1a;
+       __asm__("cpuid" : "=a"(f1a), "=c"(f1c), "=d"(f1d) : "a"(1) : "ebx");
+     }
+     if (n >= 7) {
+       U32 f7a;
+       __asm__("cpuid"
+               : "=a"(f7a), "=b"(f7b), "=c"(f7c)
+               : "a"(7), "c"(0)
+               : "edx");
+     }
+ #endif
+     {
+         ZSTD_cpuid_t cpuid;
+         cpuid.f1c = f1c;
+         cpuid.f1d = f1d;
+         cpuid.f7b = f7b;
+         cpuid.f7c = f7c;
+         return cpuid;
+     }
+ }
+ 
+ /* X(name, r, bit) defines the accessor ZSTD_cpuid_<name>(cpuid), which
+  * returns 1 when bit number `bit` of the word `cpuid.r` is set and 0
+  * otherwise.  The short-lived helpers C, D and B below bind `r` to one of
+  * the four words and are #undef'd after each table. */
+ #define X(name, r, bit)                                                        \
+   MEM_STATIC int ZSTD_cpuid_##name(ZSTD_cpuid_t const cpuid) {                 \
+     return ((cpuid.r) & (1U << bit)) != 0;                                     \
+   }
+ 
+ /* cpuid(1): Processor Info and Feature Bits. */
+ /* Flags stored in f1c */
+ #define C(name, bit) X(name, f1c, bit)
+   C(sse3, 0)
+   C(pclmuldq, 1)
+   C(dtes64, 2)
+   C(monitor, 3)
+   C(dscpl, 4)
+   C(vmx, 5)
+   C(smx, 6)
+   C(eist, 7)
+   C(tm2, 8)
+   C(ssse3, 9)
+   C(cnxtid, 10)
+   C(fma, 12)
+   C(cx16, 13)
+   C(xtpr, 14)
+   C(pdcm, 15)
+   C(pcid, 17)
+   C(dca, 18)
+   C(sse41, 19)
+   C(sse42, 20)
+   C(x2apic, 21)
+   C(movbe, 22)
+   C(popcnt, 23)
+   C(tscdeadline, 24)
+   C(aes, 25)
+   C(xsave, 26)
+   C(osxsave, 27)
+   C(avx, 28)
+   C(f16c, 29)
+   C(rdrand, 30)
+ #undef C
+ /* Flags stored in f1d */
+ #define D(name, bit) X(name, f1d, bit)
+   D(fpu, 0)
+   D(vme, 1)
+   D(de, 2)
+   D(pse, 3)
+   D(tsc, 4)
+   D(msr, 5)
+   D(pae, 6)
+   D(mce, 7)
+   D(cx8, 8)
+   D(apic, 9)
+   D(sep, 11)
+   D(mtrr, 12)
+   D(pge, 13)
+   D(mca, 14)
+   D(cmov, 15)
+   D(pat, 16)
+   D(pse36, 17)
+   D(psn, 18)
+   D(clfsh, 19)
+   D(ds, 21)
+   D(acpi, 22)
+   D(mmx, 23)
+   D(fxsr, 24)
+   D(sse, 25)
+   D(sse2, 26)
+   D(ss, 27)
+   D(htt, 28)
+   D(tm, 29)
+   D(pbe, 31)
+ #undef D
+ 
+ /* cpuid(7): Extended Features. */
+ /* Flags stored in f7b */
+ #define B(name, bit) X(name, f7b, bit)
+   B(bmi1, 3)
+   B(hle, 4)
+   B(avx2, 5)
+   B(smep, 7)
+   B(bmi2, 8)
+   B(erms, 9)
+   B(invpcid, 10)
+   B(rtm, 11)
+   B(mpx, 14)
+   B(avx512f, 16)
+   B(avx512dq, 17)
+   B(rdseed, 18)
+   B(adx, 19)
+   B(smap, 20)
+   B(avx512ifma, 21)
+   B(pcommit, 22)
+   B(clflushopt, 23)
+   B(clwb, 24)
+   B(avx512pf, 26)
+   B(avx512er, 27)
+   B(avx512cd, 28)
+   B(sha, 29)
+   B(avx512bw, 30)
+   B(avx512vl, 31)
+ #undef B
+ /* Flags stored in f7c */
+ #define C(name, bit) X(name, f7c, bit)
+   C(prefetchwt1, 0)
+   C(avx512vbmi, 1)
+ #undef C
+ 
+ #undef X
+ 
+ #endif /* ZSTD_COMMON_CPU_H */
--- a/vendor/github.com/DataDog/zstd/debug.c 0 → 100644
查看文件 @4f5343b
+++ b/vendor/github.com/DataDog/zstd/debug.c 0 → 100644
查看文件 @4f5343b
+ /* ******************************************************************
+    debug
+    Part of FSE library
+    Copyright (C) 2013-present, Yann Collet.
+ 
+    BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php)
+ 
+    Redistribution and use in source and binary forms, with or without
+    modification, are permitted provided that the following conditions are
+    met:
+ 
+        * Redistributions of source code must retain the above copyright
+    notice, this list of conditions and the following disclaimer.
+        * Redistributions in binary form must reproduce the above
+    copyright notice, this list of conditions and the following disclaimer
+    in the documentation and/or other materials provided with the
+    distribution.
+ 
+    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+    "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+    OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+    SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+    LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+    DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+    THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+    (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+    OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ 
+    You can contact the author at :
+    - Source repository : https://github.com/Cyan4973/FiniteStateEntropy
+ ****************************************************************** */
+ 
+ 
+ /*
+  * This module only hosts one global variable
+  * which can be used to dynamically influence the verbosity of traces,
+  * such as DEBUGLOG and RAWLOG
+  */
+ 
+ #include "debug.h"
+ 
+ int g_debuglevel = DEBUGLEVEL;
--- a/vendor/github.com/DataDog/zstd/debug.h 0 → 100644
查看文件 @4f5343b
+++ b/vendor/github.com/DataDog/zstd/debug.h 0 → 100644
查看文件 @4f5343b
+ /* ******************************************************************
+    debug
+    Part of FSE library
+    Copyright (C) 2013-present, Yann Collet.
+ 
+    BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php)
+ 
+    Redistribution and use in source and binary forms, with or without
+    modification, are permitted provided that the following conditions are
+    met:
+ 
+        * Redistributions of source code must retain the above copyright
+    notice, this list of conditions and the following disclaimer.
+        * Redistributions in binary form must reproduce the above
+    copyright notice, this list of conditions and the following disclaimer
+    in the documentation and/or other materials provided with the
+    distribution.
+ 
+    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+    "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+    OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+    SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+    LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+    DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+    THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+    (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+    OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ 
+    You can contact the author at :
+    - Source repository : https://github.com/Cyan4973/FiniteStateEntropy
+ ****************************************************************** */
+ 
+ 
+ /*
+  * The purpose of this header is to enable debug functions.
+  * They regroup assert(), DEBUGLOG() and RAWLOG() for run-time,
+  * and DEBUG_STATIC_ASSERT() for compile-time.
+  *
+  * By default, DEBUGLEVEL==0, which means run-time debug is disabled.
+  *
+  * Level 1 enables assert() only.
+  * Starting level 2, traces can be generated and pushed to stderr.
+  * The higher the level, the more verbose the traces.
+  *
+  * It's possible to dynamically adjust level using variable g_debuglevel,
+  * which is only declared if DEBUGLEVEL>=2,
+  * and is a global variable, not multi-thread protected (use with care)
+  */
+ 
+ #ifndef DEBUG_H_12987983217
+ #define DEBUG_H_12987983217
+ 
+ #if defined (__cplusplus)
+ extern "C" {
+ #endif
+ 
+ 
+ /* static assert is triggered at compile time, leaving no runtime artefact.
+  * static assert only works with compile-time constants.
+  * Also, this variant can only be used inside a function. */
+ #define DEBUG_STATIC_ASSERT(c) (void)sizeof(char[(c) ? 1 : -1])
+ 
+ 
+ /* DEBUGLEVEL is expected to be defined externally,
+  * typically through compiler command line.
+  * Value must be a number. */
+ #ifndef DEBUGLEVEL
+ #  define DEBUGLEVEL 0
+ #endif
+ 
+ 
+ /* DEBUGFILE can be defined externally,
+  * typically through compiler command line.
+  * note : currently useless.
+  * Value must be stderr or stdout */
+ #ifndef DEBUGFILE
+ #  define DEBUGFILE stderr
+ #endif
+ 
+ 
+ /* recommended values for DEBUGLEVEL :
+  * 0 : release mode, no debug, all run-time checks disabled
+  * 1 : enables assert() only, no display
+  * 2 : reserved, for currently active debug path
+  * 3 : events once per object lifetime (CCtx, CDict, etc.)
+  * 4 : events once per frame
+  * 5 : events once per block
+  * 6 : events once per sequence (verbose)
+  * 7+: events at every position (*very* verbose)
+  *
+  * It's generally inconvenient to output traces > 5.
+  * In which case, it's possible to selectively trigger high verbosity levels
+  * by modifying g_debuglevel.
+  */
+ 
+ #if (DEBUGLEVEL>=1)
+ #  include <assert.h>
+ #else
+ #  ifndef assert   /* assert may be already defined, due to prior #include <assert.h> */
+ #    define assert(condition) ((void)0)   /* disable assert (default) */
+ #  endif
+ #endif
+ 
+ #if (DEBUGLEVEL>=2)
+ #  include <stdio.h>
+ extern int g_debuglevel; /* the variable is only declared,
+                             it actually lives in debug.c,
+                             and is shared by the whole process.
+                             It's not thread-safe.
+                             It's useful when enabling very verbose levels
+                             on selective conditions (such as position in src) */
+ /* Trace macros, active only when DEBUGLEVEL>=2.
+  *
+  * RAWLOG(l, ...)   : if l <= g_debuglevel, passes the variadic arguments
+  *                    straight to fprintf(stderr, ...).
+  * DEBUGLOG(l, ...) : same test, but the output is prefixed with the source
+  *                    file name followed by ": " and terminated with " \n".
+  *                    The prefix is pasted in front of the first variadic
+  *                    argument by string-literal concatenation, so that
+  *                    argument has to be a string literal.
+  *
+  * Both macros write to stderr directly; DEBUGFILE is not consulted here.
+  * Both expand to a bare brace block (not a do/while(0) wrapper), and `l` is
+  * expanded without parentheses.
+  * When DEBUGLEVEL<2 both macros expand to an empty block and their arguments
+  * are not evaluated.
+  */
+ #  define RAWLOG(l, ...) {                                      \
+                 if (l<=g_debuglevel) {                          \
+                     fprintf(stderr, __VA_ARGS__);               \
+             }   }
+ #  define DEBUGLOG(l, ...) {                                    \
+                 if (l<=g_debuglevel) {                          \
+                     fprintf(stderr, __FILE__ ": " __VA_ARGS__); \
+                     fprintf(stderr, " \n");                     \
+             }   }
+ #else
+ #  define RAWLOG(l, ...)      {}    /* disabled */
+ #  define DEBUGLOG(l, ...)    {}    /* disabled */
+ #endif
+ 
+ 
+ #if defined (__cplusplus)
+ }
+ #endif
+ 
+ #endif /* DEBUG_H_12987983217 */
--- a/vendor/github.com/DataDog/zstd/divsufsort.c 0 → 100644
查看文件 @4f5343b
+++ b/vendor/github.com/DataDog/zstd/divsufsort.c 0 → 100644
查看文件 @4f5343b
+ /*
+  * divsufsort.c for libdivsufsort-lite
+  * Copyright (c) 2003-2008 Yuta Mori All Rights Reserved.
+  *
+  * Permission is hereby granted, free of charge, to any person
+  * obtaining a copy of this software and associated documentation
+  * files (the "Software"), to deal in the Software without
+  * restriction, including without limitation the rights to use,
+  * copy, modify, merge, publish, distribute, sublicense, and/or sell
+  * copies of the Software, and to permit persons to whom the
+  * Software is furnished to do so, subject to the following
+  * conditions:
+  *
+  * The above copyright notice and this permission notice shall be
+  * included in all copies or substantial portions of the Software.
+  *
+  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+  * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+  * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+  * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+  * OTHER DEALINGS IN THE SOFTWARE.
+  */
+ 
+ /*- Compiler specifics -*/
+ #ifdef __clang__
+ #pragma clang diagnostic ignored "-Wshorten-64-to-32"
+ #endif
+ 
+ #if defined(_MSC_VER)
+ #  pragma warning(disable : 4244)
+ #  pragma warning(disable : 4127)    /* C4127 : Condition expression is constant */
+ #endif
+ 
+ 
+ /*- Dependencies -*/
+ #include <assert.h>
+ #include <stdio.h>
+ #include <stdlib.h>
+ 
+ #include "divsufsort.h"
+ 
+ /*- Constants -
+  * Compile-time tunables for the sorter. Each one may be pre-defined by the
+  * build; out-of-range values are clamped or replaced by the defaults below.
+  *
+  *   INLINE                     always redefined to __inline in this file
+  *   ALPHABET_SIZE              default 256; a value < 1 is discarded
+  *   BUCKET_A_SIZE              ALPHABET_SIZE
+  *   BUCKET_B_SIZE              ALPHABET_SIZE squared
+  *   SS_INSERTIONSORT_THRESHOLD default 8; values < 1 are raised to 1
+  *   SS_BLOCKSIZE               default 1024; clamped to the range 0..32767
+  *   SS_MISORT_STACKSIZE        96 / 16 / 24 depending on SS_BLOCKSIZE
+  *   SS_SMERGE_STACKSIZE        32
+  *   TR_INSERTIONSORT_THRESHOLD 8
+  *   TR_STACKSIZE               64
+  */
+ #if defined(INLINE)
+ # undef INLINE
+ #endif
+ #if !defined(INLINE)
+ # define INLINE __inline
+ #endif
+ #if defined(ALPHABET_SIZE) && (ALPHABET_SIZE < 1)
+ # undef ALPHABET_SIZE
+ #endif
+ #if !defined(ALPHABET_SIZE)
+ # define ALPHABET_SIZE (256)
+ #endif
+ #define BUCKET_A_SIZE (ALPHABET_SIZE)
+ #define BUCKET_B_SIZE (ALPHABET_SIZE * ALPHABET_SIZE)
+ #if defined(SS_INSERTIONSORT_THRESHOLD)
+ # if SS_INSERTIONSORT_THRESHOLD < 1
+ #  undef SS_INSERTIONSORT_THRESHOLD
+ #  define SS_INSERTIONSORT_THRESHOLD (1)
+ # endif
+ #else
+ # define SS_INSERTIONSORT_THRESHOLD (8)
+ #endif
+ #if defined(SS_BLOCKSIZE)
+ # if SS_BLOCKSIZE < 0
+ #  undef SS_BLOCKSIZE
+ #  define SS_BLOCKSIZE (0)
+ # elif 32768 <= SS_BLOCKSIZE
+ #  undef SS_BLOCKSIZE
+ #  define SS_BLOCKSIZE (32767)
+ # endif
+ #else
+ # define SS_BLOCKSIZE (1024)
+ #endif
+ /* minstacksize = log(SS_BLOCKSIZE) / log(3) * 2 */
+ #if SS_BLOCKSIZE == 0
+ # define SS_MISORT_STACKSIZE (96)
+ #elif SS_BLOCKSIZE <= 4096
+ # define SS_MISORT_STACKSIZE (16)
+ #else
+ # define SS_MISORT_STACKSIZE (24)
+ #endif
+ #define SS_SMERGE_STACKSIZE (32)
+ #define TR_INSERTIONSORT_THRESHOLD (8)
+ #define TR_STACKSIZE (64)
+ 
+ 
+ /*- Macros -
+  * These helpers are unhygienic: they rely on names that the calling
+  * function must have in scope.
+  *
+  *   SWAP(a, b)        exchanges a and b through a caller-declared temporary
+  *                     named `t` of a compatible type.
+  *   MIN / MAX         evaluate their arguments more than once.
+  *   STACK_PUSH(5)     store 4 (or 5) values in stack[ssize] and increment
+  *                     ssize; `stack`, `ssize` and STACK_SIZE come from the
+  *                     enclosing function. Overflow is only caught by assert().
+  *   STACK_POP(5)      when ssize is 0 they execute `return;` in the enclosing
+  *                     function (this is how the iterative sorts terminate);
+  *                     otherwise they decrement ssize and load the saved values.
+  *   BUCKET_A(c0)      element c0 of the caller's `bucket_A` array.
+  *   BUCKET_B(c0, c1)  / BUCKET_BSTAR(c0, c1) index the caller's `bucket_B`
+  *                     array with the two characters in opposite orders; for
+  *                     ALPHABET_SIZE == 256 the multiplication is written as a
+  *                     shift-and-or.
+  */
+ #ifndef SWAP
+ # define SWAP(_a, _b) do { t = (_a); (_a) = (_b); (_b) = t; } while(0)
+ #endif /* SWAP */
+ #ifndef MIN
+ # define MIN(_a, _b) (((_a) < (_b)) ? (_a) : (_b))
+ #endif /* MIN */
+ #ifndef MAX
+ # define MAX(_a, _b) (((_a) > (_b)) ? (_a) : (_b))
+ #endif /* MAX */
+ #define STACK_PUSH(_a, _b, _c, _d)\
+   do {\
+     assert(ssize < STACK_SIZE);\
+     stack[ssize].a = (_a), stack[ssize].b = (_b),\
+     stack[ssize].c = (_c), stack[ssize++].d = (_d);\
+   } while(0)
+ #define STACK_PUSH5(_a, _b, _c, _d, _e)\
+   do {\
+     assert(ssize < STACK_SIZE);\
+     stack[ssize].a = (_a), stack[ssize].b = (_b),\
+     stack[ssize].c = (_c), stack[ssize].d = (_d), stack[ssize++].e = (_e);\
+   } while(0)
+ #define STACK_POP(_a, _b, _c, _d)\
+   do {\
+     assert(0 <= ssize);\
+     if(ssize == 0) { return; }\
+     (_a) = stack[--ssize].a, (_b) = stack[ssize].b,\
+     (_c) = stack[ssize].c, (_d) = stack[ssize].d;\
+   } while(0)
+ #define STACK_POP5(_a, _b, _c, _d, _e)\
+   do {\
+     assert(0 <= ssize);\
+     if(ssize == 0) { return; }\
+     (_a) = stack[--ssize].a, (_b) = stack[ssize].b,\
+     (_c) = stack[ssize].c, (_d) = stack[ssize].d, (_e) = stack[ssize].e;\
+   } while(0)
+ #define BUCKET_A(_c0) bucket_A[(_c0)]
+ #if ALPHABET_SIZE == 256
+ #define BUCKET_B(_c0, _c1) (bucket_B[((_c1) << 8) | (_c0)])
+ #define BUCKET_BSTAR(_c0, _c1) (bucket_B[((_c0) << 8) | (_c1)])
+ #else
+ #define BUCKET_B(_c0, _c1) (bucket_B[(_c1) * ALPHABET_SIZE + (_c0)])
+ #define BUCKET_BSTAR(_c0, _c1) (bucket_B[(_c0) * ALPHABET_SIZE + (_c1)])
+ #endif
+ 
+ 
+ /*- Private Functions -*/
+ /* lg_table[i] is the position of the highest set bit of the byte value i,
+  * i.e. floor(log2(i)) for i in 1..255, and -1 for i == 0.
+  * The *_ilg helpers and ss_isqrt combine it with a byte offset (0, 8, 16, 24)
+  * to obtain the same quantity for wider integers.
+  */
+ static const int lg_table[256]= {
+  -1,0,1,1,2,2,2,2,3,3,3,3,3,3,3,3,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,
+   5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,
+   6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,
+   6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,
+   7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,
+   7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,
+   7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,
+   7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7
+ };
+ 
+ #if (SS_BLOCKSIZE == 0) || (SS_INSERTIONSORT_THRESHOLD < SS_BLOCKSIZE)
+ /* Integer base-2 logarithm of n, built from lg_table lookups on the highest
+  * non-zero byte of n. Returns -1 when the inspected bits of n are all zero.
+  *
+  * The width that is inspected depends on SS_BLOCKSIZE:
+  *   SS_BLOCKSIZE == 0   : all 32 bits of n are considered;
+  *   SS_BLOCKSIZE <  256 : n is used directly as a table index
+  *                         (assumes 0 <= n < 256 - confirm against callers);
+  *   otherwise           : only the low 16 bits of n are considered.
+  */
+ static INLINE
+ int
+ ss_ilg(int n) {
+ #if SS_BLOCKSIZE == 0
+   return (n & 0xffff0000) ?
+           ((n & 0xff000000) ?
+             24 + lg_table[(n >> 24) & 0xff] :
+             16 + lg_table[(n >> 16) & 0xff]) :
+           ((n & 0x0000ff00) ?
+              8 + lg_table[(n >>  8) & 0xff] :
+              0 + lg_table[(n >>  0) & 0xff]);
+ #elif SS_BLOCKSIZE < 256
+   return lg_table[n];
+ #else
+   return (n & 0xff00) ?
+           8 + lg_table[(n >> 8) & 0xff] :
+           0 + lg_table[(n >> 0) & 0xff];
+ #endif
+ }
+ 
+ #endif /* (SS_BLOCKSIZE == 0) || (SS_INSERTIONSORT_THRESHOLD < SS_BLOCKSIZE) */
+ 
+ #if SS_BLOCKSIZE != 0
+ /* Lookup table used by ss_isqrt to seed its square-root estimate.
+  * The entries appear to be floor(16 * sqrt(i)) for i in 0..255
+  * (e.g. [1] = 16, [4] = 32, [64] = 128, [255] = 255); ss_isqrt recovers
+  * floor(sqrt(x)) for x < 256 as sqq_table[x] >> 4.
+  */
+ static const int sqq_table[256] = {
+   0,  16,  22,  27,  32,  35,  39,  42,  45,  48,  50,  53,  55,  57,  59,  61,
+  64,  65,  67,  69,  71,  73,  75,  76,  78,  80,  81,  83,  84,  86,  87,  89,
+  90,  91,  93,  94,  96,  97,  98,  99, 101, 102, 103, 104, 106, 107, 108, 109,
+ 110, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126,
+ 128, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142,
+ 143, 144, 144, 145, 146, 147, 148, 149, 150, 150, 151, 152, 153, 154, 155, 155,
+ 156, 157, 158, 159, 160, 160, 161, 162, 163, 163, 164, 165, 166, 167, 167, 168,
+ 169, 170, 170, 171, 172, 173, 173, 174, 175, 176, 176, 177, 178, 178, 179, 180,
+ 181, 181, 182, 183, 183, 184, 185, 185, 186, 187, 187, 188, 189, 189, 190, 191,
+ 192, 192, 193, 193, 194, 195, 195, 196, 197, 197, 198, 199, 199, 200, 201, 201,
+ 202, 203, 203, 204, 204, 205, 206, 206, 207, 208, 208, 209, 209, 210, 211, 211,
+ 212, 212, 213, 214, 214, 215, 215, 216, 217, 217, 218, 218, 219, 219, 220, 221,
+ 221, 222, 222, 223, 224, 224, 225, 225, 226, 226, 227, 227, 228, 229, 229, 230,
+ 230, 231, 231, 232, 232, 233, 234, 234, 235, 235, 236, 236, 237, 237, 238, 238,
+ 239, 240, 240, 241, 241, 242, 242, 243, 243, 244, 244, 245, 245, 246, 246, 247,
+ 247, 248, 248, 249, 249, 250, 250, 251, 251, 252, 252, 253, 253, 254, 254, 255
+ };
+ /* Integer square root of x, saturated at SS_BLOCKSIZE.
+  *
+  * Any x >= SS_BLOCKSIZE * SS_BLOCKSIZE yields SS_BLOCKSIZE. Otherwise the
+  * highest set bit e of x selects one of three paths:
+  *   e >= 16 : table estimate scaled up, refined by one averaging step
+  *             y = (y + 1 + x / y) >> 1 (two steps when e >= 24);
+  *   e >=  8 : table estimate scaled down, plus one;
+  *   e <   8 : direct table lookup, returned immediately.
+  * The first two paths finish by stepping y down by one if y * y exceeds x.
+  */
+ static INLINE
+ int
+ ss_isqrt(int x) {
+   int y, e;
+ 
+   if(x >= (SS_BLOCKSIZE * SS_BLOCKSIZE)) { return SS_BLOCKSIZE; }
+   e = (x & 0xffff0000) ?
+         ((x & 0xff000000) ?
+           24 + lg_table[(x >> 24) & 0xff] :
+           16 + lg_table[(x >> 16) & 0xff]) :
+         ((x & 0x0000ff00) ?
+            8 + lg_table[(x >>  8) & 0xff] :
+            0 + lg_table[(x >>  0) & 0xff]);
+ 
+   if(e >= 16) {
+     y = sqq_table[x >> ((e - 6) - (e & 1))] << ((e >> 1) - 7);
+     if(e >= 24) { y = (y + 1 + x / y) >> 1; }
+     y = (y + 1 + x / y) >> 1;
+   } else if(e >= 8) {
+     y = (sqq_table[x >> ((e - 6) - (e & 1))] >> (7 - (e >> 1))) + 1;
+   } else {
+     return sqq_table[x] >> 4;
+   }
+ 
+   return (x < (y * y)) ? y - 1 : y;
+ }
+ 
+ #endif /* SS_BLOCKSIZE != 0 */
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ 
+ /* Compares two suffixes.
+  *
+  * p1 and p2 point into an array of text positions. The first substring is
+  * the byte range of T from (*p1 + depth) up to, but excluding,
+  * (*(p1 + 1) + 2); the second is defined the same way from p2. Note that the
+  * entry following each pointer is read to find the end of the range.
+  *
+  * Returns a negative, zero or positive value: the difference of the first
+  * pair of differing bytes when both ranges still have bytes left; otherwise
+  * 1 if only the first range has bytes left, -1 if only the second has, and
+  * 0 if both ranges are exhausted together.
+  */
+ static INLINE
+ int
+ ss_compare(const unsigned char *T,
+            const int *p1, const int *p2,
+            int depth) {
+   const unsigned char *U1, *U2, *U1n, *U2n;
+ 
+   for(U1 = T + depth + *p1,
+       U2 = T + depth + *p2,
+       U1n = T + *(p1 + 1) + 2,
+       U2n = T + *(p2 + 1) + 2;
+       (U1 < U1n) && (U2 < U2n) && (*U1 == *U2);
+       ++U1, ++U2) {
+   }
+ 
+   return U1 < U1n ?
+         (U2 < U2n ? *U1 - *U2 : 1) :
+         (U2 < U2n ? -1 : 0);
+ }
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ 
+ #if (SS_BLOCKSIZE != 1) && (SS_INSERTIONSORT_THRESHOLD != 1)
+ 
+ /* Insertionsort for small size groups
+  *
+  * Sorts the indices in [first, last) by the substrings they designate in PA,
+  * using ss_compare at the given depth. The range is processed from the
+  * right: each element *i is inserted into the already sorted tail to its
+  * right.
+  *
+  * Entries that compare equal to the element inserted just before them are
+  * flagged by storing their bitwise complement (a negative value); while
+  * shifting, such flagged entries are skipped together with the entry that
+  * precedes them.
+  */
+ static
+ void
+ ss_insertionsort(const unsigned char *T, const int *PA,
+                  int *first, int *last, int depth) {
+   int *i, *j;
+   int t;
+   int r;
+ 
+   for(i = last - 2; first <= i; --i) {
+     for(t = *i, j = i + 1; 0 < (r = ss_compare(T, PA + t, PA + *j, depth));) {
+       do { *(j - 1) = *j; } while((++j < last) && (*j < 0)); /* shift left, skipping flagged entries */
+       if(last <= j) { break; }
+     }
+     if(r == 0) { *j = ~*j; } /* equal to its new right neighbour: flag that neighbour */
+     *(j - 1) = t;
+   }
+ }
+ 
+ #endif /* (SS_BLOCKSIZE != 1) && (SS_INSERTIONSORT_THRESHOLD != 1) */
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ 
+ #if (SS_BLOCKSIZE == 0) || (SS_INSERTIONSORT_THRESHOLD < SS_BLOCKSIZE)
+ /* Sift-down step for ss_heapsort.
+  *
+  * Treats SA[0..size) as a binary heap ordered by the key Td[PA[SA[k]]]
+  * (largest key at the root) and moves the element at index i down until
+  * neither child has a larger key. The displaced value v is written once, at
+  * its final position.
+  */
+ static INLINE
+ void
+ ss_fixdown(const unsigned char *Td, const int *PA,
+            int *SA, int i, int size) {
+   int j, k;
+   int v;
+   int c, d, e;
+ 
+   for(v = SA[i], c = Td[PA[v]]; (j = 2 * i + 1) < size; SA[i] = SA[k], i = k) {
+     d = Td[PA[SA[k = j++]]];
+     if(d < (e = Td[PA[SA[j]]])) { k = j; d = e; } /* pick the child with the larger key */
+     if(d <= c) { break; }
+   }
+   SA[i] = v;
+ }
+ 
+ /* Simple top-down heapsort.
+  *
+  * Sorts SA[0..size) in ascending order of the single-byte key
+  * Td[PA[SA[k]]]. The heap is always built over an odd number of elements:
+  * when size is even the last element is set aside (m = size - 1), compared
+  * with the element at index m / 2, and re-inserted after the heap is built.
+  */
+ static
+ void
+ ss_heapsort(const unsigned char *Td, const int *PA, int *SA, int size) {
+   int i, m;
+   int t;
+ 
+   m = size;
+   if((size % 2) == 0) {
+     m--;
+     if(Td[PA[SA[m / 2]]] < Td[PA[SA[m]]]) { SWAP(SA[m], SA[m / 2]); }
+   }
+ 
+   for(i = m / 2 - 1; 0 <= i; --i) { ss_fixdown(Td, PA, SA, i, m); } /* build the heap */
+   if((size % 2) == 0) { SWAP(SA[0], SA[m]); ss_fixdown(Td, PA, SA, 0, m); }
+   for(i = m - 1; 0 < i; --i) { /* repeatedly move the current maximum to the end */
+     t = SA[0], SA[0] = SA[i];
+     ss_fixdown(Td, PA, SA, 0, i);
+     SA[i] = t;
+   }
+ }
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ 
+ /* Returns the median of three elements.
+  *
+  * The elements are compared by the key Td[PA[*v]]. Only the local pointer
+  * copies v1..v3 are exchanged; the pointed-to array is not modified. The
+  * return value is one of the three pointers passed in. `t` is the
+  * temporary required by the SWAP macro.
+  */
+ static INLINE
+ int *
+ ss_median3(const unsigned char *Td, const int *PA,
+            int *v1, int *v2, int *v3) {
+   int *t;
+   if(Td[PA[*v1]] > Td[PA[*v2]]) { SWAP(v1, v2); }
+   if(Td[PA[*v2]] > Td[PA[*v3]]) {
+     if(Td[PA[*v1]] > Td[PA[*v3]]) { return v1; }
+     else { return v3; }
+   }
+   return v2;
+ }
+ 
+ /* Returns the median of five elements.
+  *
+  * Same conventions as ss_median3: keys are Td[PA[*v]], only the local
+  * pointer copies are exchanged, and the result is one of the five pointers
+  * passed in. `t` is the temporary required by the SWAP macro.
+  */
+ static INLINE
+ int *
+ ss_median5(const unsigned char *Td, const int *PA,
+            int *v1, int *v2, int *v3, int *v4, int *v5) {
+   int *t;
+   if(Td[PA[*v2]] > Td[PA[*v3]]) { SWAP(v2, v3); }
+   if(Td[PA[*v4]] > Td[PA[*v5]]) { SWAP(v4, v5); }
+   if(Td[PA[*v2]] > Td[PA[*v4]]) { SWAP(v2, v4); SWAP(v3, v5); }
+   if(Td[PA[*v1]] > Td[PA[*v3]]) { SWAP(v1, v3); }
+   if(Td[PA[*v1]] > Td[PA[*v4]]) { SWAP(v1, v4); SWAP(v3, v5); }
+   if(Td[PA[*v3]] > Td[PA[*v4]]) { return v4; }
+   return v3;
+ }
+ 
+ /* Returns the pivot element.
+  *
+  * Chooses a pivot for [first, last) according to the range length t:
+  *   t <= 32  : median of first, middle and last - 1;
+  *   t <= 512 : median of five samples spaced t / 4 apart;
+  *   larger   : median of three medians-of-three, taken around the start,
+  *              the middle and the end of the range with spacing t / 8.
+  * The result points at one of the sampled elements; nothing is moved.
+  */
+ static INLINE
+ int *
+ ss_pivot(const unsigned char *Td, const int *PA, int *first, int *last) {
+   int *middle;
+   int t;
+ 
+   t = last - first;
+   middle = first + t / 2;
+ 
+   if(t <= 512) {
+     if(t <= 32) {
+       return ss_median3(Td, PA, first, middle, last - 1);
+     } else {
+       t >>= 2;
+       return ss_median5(Td, PA, first, first + t, middle, last - 1 - t, last - 1);
+     }
+   }
+   t >>= 3;
+   first  = ss_median3(Td, PA, first, first + t, first + (t << 1));
+   middle = ss_median3(Td, PA, middle - t, middle, middle + t);
+   last   = ss_median3(Td, PA, last - 1 - (t << 1), last - 1 - t, last - 1);
+   return ss_median3(Td, PA, first, middle, last);
+ }
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ 
+ /* Binary partition for substrings.
+  *
+  * Splits [first, last) in two by the predicate
+  *     PA[*x] + depth >= PA[*x + 1] + 1
+  * i.e. whether the substring designated by *x has no byte left at offset
+  * `depth` (its end being PA[*x + 1] + 2, as in ss_compare). Entries that
+  * satisfy the predicate are gathered at the front and stored
+  * complemented (~value); the others follow unchanged.
+  *
+  * Returns a pointer to the first entry of the second part. If the first
+  * part is not empty, its first entry is complemented once more, which
+  * restores that entry's original value.
+  */
+ static INLINE
+ int *
+ ss_partition(const int *PA,
+                     int *first, int *last, int depth) {
+   int *a, *b;
+   int t;
+   for(a = first - 1, b = last;;) {
+     for(; (++a < b) && ((PA[*a] + depth) >= (PA[*a + 1] + 1));) { *a = ~*a; }
+     for(; (a < --b) && ((PA[*b] + depth) <  (PA[*b + 1] + 1));) { }
+     if(b <= a) { break; }
+     t = ~*b;
+     *b = *a;
+     *a = t;
+   }
+   if(first < a) { *first = ~*first; }
+   return a;
+ }
+ 
+ /* Multikey introsort for medium size groups.
+  *
+  * Sorts the indices in [first, last) by the substrings they designate,
+  * starting at byte offset `depth`. The routine is iterative: pending
+  * sub-ranges are kept as (first, last, depth, limit) tuples on a local stack
+  * of SS_MISORT_STACKSIZE entries, and the function returns from inside
+  * STACK_POP once that stack is empty.
+  *
+  * Per iteration:
+  *   - ranges of at most SS_INSERTIONSORT_THRESHOLD elements go to
+  *     ss_insertionsort;
+  *   - `limit` (initialised with ss_ilg of the range length) is decremented
+  *     on every partitioning round; when it reaches zero the range is sorted
+  *     on its current byte with ss_heapsort and then split into runs of
+  *     equal bytes (the `limit < 0` branch);
+  *   - otherwise a pivot byte is chosen with ss_pivot and the range is
+  *     partitioned three ways (less / equal / greater); the equal part
+  *     continues at depth + 1, and ss_partition separates the substrings
+  *     that end at the current depth.
+  */
+ static
+ void
+ ss_mintrosort(const unsigned char *T, const int *PA,
+               int *first, int *last,
+               int depth) {
+ #define STACK_SIZE SS_MISORT_STACKSIZE
+   struct { int *a, *b, c; int d; } stack[STACK_SIZE];
+   const unsigned char *Td;
+   int *a, *b, *c, *d, *e, *f;
+   int s, t;
+   int ssize;
+   int limit;
+   int v, x = 0;
+ 
+   for(ssize = 0, limit = ss_ilg(last - first);;) {
+ 
+     if((last - first) <= SS_INSERTIONSORT_THRESHOLD) {
+ #if 1 < SS_INSERTIONSORT_THRESHOLD
+       if(1 < (last - first)) { ss_insertionsort(T, PA, first, last, depth); }
+ #endif
+       STACK_POP(first, last, depth, limit); /* returns from the function when no work is left */
+       continue;
+     }
+ 
+     Td = T + depth;
+     if(limit-- == 0) { ss_heapsort(Td, PA, first, last - first); }
+     if(limit < 0) {
+       for(a = first + 1, v = Td[PA[*first]]; a < last; ++a) {
+         if((x = Td[PA[*a]]) != v) {
+           if(1 < (a - first)) { break; }
+           v = x;
+           first = a;
+         }
+       }
+       if(Td[PA[*first] - 1] < v) {
+         first = ss_partition(PA, first, a, depth);
+       }
+       if((a - first) <= (last - a)) {
+         if(1 < (a - first)) {
+           STACK_PUSH(a, last, depth, -1);
+           last = a, depth += 1, limit = ss_ilg(a - first);
+         } else {
+           first = a, limit = -1;
+         }
+       } else {
+         if(1 < (last - a)) {
+           STACK_PUSH(first, a, depth + 1, ss_ilg(a - first));
+           first = a, limit = -1;
+         } else {
+           last = a, depth += 1, limit = ss_ilg(a - first);
+         }
+       }
+       continue;
+     }
+ 
+     /* choose pivot */
+     a = ss_pivot(Td, PA, first, last);
+     v = Td[PA[*a]];
+     SWAP(*first, *a);
+ 
+     /* partition */
+     for(b = first; (++b < last) && ((x = Td[PA[*b]]) == v);) { }
+     if(((a = b) < last) && (x < v)) {
+       for(; (++b < last) && ((x = Td[PA[*b]]) <= v);) {
+         if(x == v) { SWAP(*b, *a); ++a; }
+       }
+     }
+     for(c = last; (b < --c) && ((x = Td[PA[*c]]) == v);) { }
+     if((b < (d = c)) && (x > v)) {
+       for(; (b < --c) && ((x = Td[PA[*c]]) >= v);) {
+         if(x == v) { SWAP(*c, *d); --d; }
+       }
+     }
+     for(; b < c;) {
+       SWAP(*b, *c);
+       for(; (++b < c) && ((x = Td[PA[*b]]) <= v);) {
+         if(x == v) { SWAP(*b, *a); ++a; }
+       }
+       for(; (b < --c) && ((x = Td[PA[*c]]) >= v);) {
+         if(x == v) { SWAP(*c, *d); --d; }
+       }
+     }
+ 
+     if(a <= d) {
+       c = b - 1;
+ 
+       if((s = a - first) > (t = b - a)) { s = t; }
+       for(e = first, f = b - s; 0 < s; --s, ++e, ++f) { SWAP(*e, *f); }
+       if((s = d - c) > (t = last - d - 1)) { s = t; }
+       for(e = b, f = last - s; 0 < s; --s, ++e, ++f) { SWAP(*e, *f); }
+ 
+       a = first + (b - a), c = last - (d - c);
+       b = (v <= Td[PA[*a] - 1]) ? a : ss_partition(PA, a, c, depth);
+ 
+       if((a - first) <= (last - c)) {
+         if((last - c) <= (c - b)) {
+           STACK_PUSH(b, c, depth + 1, ss_ilg(c - b));
+           STACK_PUSH(c, last, depth, limit);
+           last = a;
+         } else if((a - first) <= (c - b)) {
+           STACK_PUSH(c, last, depth, limit);
+           STACK_PUSH(b, c, depth + 1, ss_ilg(c - b));
+           last = a;
+         } else {
+           STACK_PUSH(c, last, depth, limit);
+           STACK_PUSH(first, a, depth, limit);
+           first = b, last = c, depth += 1, limit = ss_ilg(c - b);
+         }
+       } else {
+         if((a - first) <= (c - b)) {
+           STACK_PUSH(b, c, depth + 1, ss_ilg(c - b));
+           STACK_PUSH(first, a, depth, limit);
+           first = c;
+         } else if((last - c) <= (c - b)) {
+           STACK_PUSH(first, a, depth, limit);
+           STACK_PUSH(b, c, depth + 1, ss_ilg(c - b));
+           first = c;
+         } else {
+           STACK_PUSH(first, a, depth, limit);
+           STACK_PUSH(c, last, depth, limit);
+           first = b, last = c, depth += 1, limit = ss_ilg(c - b);
+         }
+       }
+     } else {
+       limit += 1;
+       if(Td[PA[*first] - 1] < v) {
+         first = ss_partition(PA, first, last, depth);
+         limit = ss_ilg(last - first);
+       }
+       depth += 1;
+     }
+   }
+ #undef STACK_SIZE
+ }
+ 
+ #endif /* (SS_BLOCKSIZE == 0) || (SS_INSERTIONSORT_THRESHOLD < SS_BLOCKSIZE) */
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ 
+ #if SS_BLOCKSIZE != 0
+ /* Exchanges the n ints starting at a with the n ints starting at b,
+  * element by element. Does nothing when n <= 0.
+  */
+ static INLINE
+ void
+ ss_blockswap(int *a, int *b, int n) {
+   int t;
+   for(; 0 < n; --n, ++a, ++b) {
+     t = *a, *a = *b, *b = t;
+   }
+ }
+ /* In-place rotation of [first, last) around middle: the two adjacent
+  * sub-ranges [first, middle) (length l) and [middle, last) (length r)
+  * trade places.
+  *
+  * Equal lengths are handled with a single ss_blockswap. Otherwise the
+  * shorter side is cycled through the longer one, the remaining lengths are
+  * reduced, and the loop repeats on what is left until one side is empty.
+  */
+ static INLINE
+ void
+ ss_rotate(int *first, int *middle, int *last) {
+   int *a, *b, t;
+   int l, r;
+   l = middle - first, r = last - middle;
+   for(; (0 < l) && (0 < r);) {
+     if(l == r) { ss_blockswap(first, middle, l); break; }
+     if(l < r) {
+       a = last - 1, b = middle - 1;
+       t = *a;
+       do {
+         *a-- = *b, *b-- = *a;
+         if(b < first) {
+           *a = t;
+           last = a;
+           if((r -= l + 1) <= l) { break; }
+           a -= 1, b = middle - 1;
+           t = *a;
+         }
+       } while(1);
+     } else {
+       a = first, b = middle;
+       t = *a;
+       do {
+         *a++ = *b, *b++ = *a;
+         if(last <= b) {
+           *a = t;
+           first = a + 1;
+           if((l -= r + 1) <= r) { break; }
+           a += 1, b = middle;
+           t = *a;
+         }
+       } while(1);
+     }
+   }
+ }
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ /* Merges the two adjacent ranges [first, middle) and [middle, last)
+  * without an auxiliary buffer.
+  *
+  * Working from the right, the last entry of the right range is located in
+  * the left range by binary search (ss_compare at `depth`), and the tail of
+  * the left range that sorts after it is moved behind it with ss_rotate.
+  * Entries may be stored complemented (negative); they are decoded with ~
+  * before being compared. When the search finds an equal entry (r == 0), the
+  * entry at the insertion point is complemented to record the tie.
+  */
+ static
+ void
+ ss_inplacemerge(const unsigned char *T, const int *PA,
+                 int *first, int *middle, int *last,
+                 int depth) {
+   const int *p;
+   int *a, *b;
+   int len, half;
+   int q, r;
+   int x;
+ 
+   for(;;) {
+     if(*(last - 1) < 0) { x = 1; p = PA + ~*(last - 1); }
+     else                { x = 0; p = PA +  *(last - 1); }
+     for(a = first, len = middle - first, half = len >> 1, r = -1;
+         0 < len;
+         len = half, half >>= 1) {
+       b = a + half;
+       q = ss_compare(T, PA + ((0 <= *b) ? *b : ~*b), p, depth);
+       if(q < 0) {
+         a = b + 1;
+         half -= (len & 1) ^ 1;
+       } else {
+         r = q;
+       }
+     }
+     if(a < middle) {
+       if(r == 0) { *a = ~*a; }
+       ss_rotate(a, middle, last);
+       last -= middle - a;
+       middle = a;
+       if(first == middle) { break; }
+     }
+     --last;
+     if(x != 0) { while(*--last < 0) { } } /* step over the run of flagged entries as well */
+     if(middle == last) { break; }
+   }
+ }
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ 
+ /* Merge-forward with internal buffer.
+  *
+  * Merges [first, middle) and [middle, last) front to back. The left range
+  * is first exchanged with buf (so buf must provide at least middle - first
+  * ints), then the output is produced in place starting at first.
+  * Elements are exchanged with the buffer rather than copied over it
+  * (presumably so that the previous contents of buf survive the merge -
+  * confirm against callers).
+  *
+  * Complemented (negative) entries are carried along with the entry that
+  * precedes them. When the two heads compare equal, the head of the right
+  * range is complemented to record the tie.
+  */
+ static
+ void
+ ss_mergeforward(const unsigned char *T, const int *PA,
+                 int *first, int *middle, int *last,
+                 int *buf, int depth) {
+   int *a, *b, *c, *bufend;
+   int t;
+   int r;
+ 
+   bufend = buf + (middle - first) - 1;
+   ss_blockswap(buf, first, middle - first);
+ 
+   for(t = *(a = first), b = buf, c = middle;;) {
+     r = ss_compare(T, PA + *b, PA + *c, depth);
+     if(r < 0) {
+       do {
+         *a++ = *b;
+         if(bufend <= b) { *bufend = t; return; }
+         *b++ = *a;
+       } while(*b < 0);
+     } else if(r > 0) {
+       do {
+         *a++ = *c, *c++ = *a;
+         if(last <= c) {
+           while(b < bufend) { *a++ = *b, *b++ = *a; }
+           *a = *b, *b = t;
+           return;
+         }
+       } while(*c < 0);
+     } else {
+       *c = ~*c;
+       do {
+         *a++ = *b;
+         if(bufend <= b) { *bufend = t; return; }
+         *b++ = *a;
+       } while(*b < 0);
+ 
+       do {
+         *a++ = *c, *c++ = *a;
+         if(last <= c) {
+           while(b < bufend) { *a++ = *b, *b++ = *a; }
+           *a = *b, *b = t;
+           return;
+         }
+       } while(*c < 0);
+     }
+   }
+ }
+ 
+ /* Merge-backward with internal buffer.
+  *
+  * Mirror image of ss_mergeforward: the right range [middle, last) is
+  * exchanged with buf (which must provide at least last - middle ints) and
+  * the output is produced in place from last - 1 downwards.
+  *
+  * p1 / p2 designate the current heads of the buffered right range and of
+  * the left range. Bits 1 and 2 of x record that the corresponding head was
+  * stored complemented, in which case the run of complemented entries is
+  * moved first and the bit is cleared. When the heads compare equal, the
+  * entry taken from the buffer is written complemented.
+  */
+ static
+ void
+ ss_mergebackward(const unsigned char *T, const int *PA,
+                  int *first, int *middle, int *last,
+                  int *buf, int depth) {
+   const int *p1, *p2;
+   int *a, *b, *c, *bufend;
+   int t;
+   int r;
+   int x;
+ 
+   bufend = buf + (last - middle) - 1;
+   ss_blockswap(buf, middle, last - middle);
+ 
+   x = 0;
+   if(*bufend < 0)       { p1 = PA + ~*bufend; x |= 1; }
+   else                  { p1 = PA +  *bufend; }
+   if(*(middle - 1) < 0) { p2 = PA + ~*(middle - 1); x |= 2; }
+   else                  { p2 = PA +  *(middle - 1); }
+   for(t = *(a = last - 1), b = bufend, c = middle - 1;;) {
+     r = ss_compare(T, p1, p2, depth);
+     if(0 < r) {
+       if(x & 1) { do { *a-- = *b, *b-- = *a; } while(*b < 0); x ^= 1; }
+       *a-- = *b;
+       if(b <= buf) { *buf = t; break; }
+       *b-- = *a;
+       if(*b < 0) { p1 = PA + ~*b; x |= 1; }
+       else       { p1 = PA +  *b; }
+     } else if(r < 0) {
+       if(x & 2) { do { *a-- = *c, *c-- = *a; } while(*c < 0); x ^= 2; }
+       *a-- = *c, *c-- = *a;
+       if(c < first) {
+         while(buf < b) { *a-- = *b, *b-- = *a; }
+         *a = *b, *b = t;
+         break;
+       }
+       if(*c < 0) { p2 = PA + ~*c; x |= 2; }
+       else       { p2 = PA +  *c; }
+     } else {
+       if(x & 1) { do { *a-- = *b, *b-- = *a; } while(*b < 0); x ^= 1; }
+       *a-- = ~*b;
+       if(b <= buf) { *buf = t; break; }
+       *b-- = *a;
+       if(x & 2) { do { *a-- = *c, *c-- = *a; } while(*c < 0); x ^= 2; }
+       *a-- = *c, *c-- = *a;
+       if(c < first) {
+         while(buf < b) { *a-- = *b, *b-- = *a; }
+         *a = *b, *b = t;
+         break;
+       }
+       if(*b < 0) { p1 = PA + ~*b; x |= 1; }
+       else       { p1 = PA +  *b; }
+       if(*c < 0) { p2 = PA + ~*c; x |= 2; }
+       else       { p2 = PA +  *c; }
+     }
+   }
+ }
+ 
+ /* D&C based merge.
+  *
+  * Merges [first, middle) and [middle, last) using a buffer of bufsize ints.
+  * The routine is iterative; pending sub-problems are kept as
+  * (first, middle, last, check) tuples on a local stack of
+  * SS_SMERGE_STACKSIZE entries and the function returns from inside
+  * STACK_POP when that stack is empty.
+  *
+  * Per iteration:
+  *   - if the right part fits in the buffer, ss_mergebackward is used;
+  *   - else if the left part fits, ss_mergeforward is used;
+  *   - otherwise a binary search finds the count m of entries to exchange
+  *     across middle, the two blocks of m entries are swapped with
+  *     ss_blockswap, and the two halves become new sub-problems (the smaller
+  *     one is processed first, the other is pushed).
+  *
+  * `check` is a bit set consumed by MERGE_CHECK once a sub-problem is done:
+  * bit 1 complements *first unconditionally, bit 2 complements *first if it
+  * compares equal to its predecessor, bit 4 does the same for *last.
+  * GETIDX decodes an entry that may be stored complemented.
+  * Note that only STACK_SIZE is #undef'd at the end; GETIDX and MERGE_CHECK
+  * stay defined for the rest of the translation unit.
+  */
+ static
+ void
+ ss_swapmerge(const unsigned char *T, const int *PA,
+              int *first, int *middle, int *last,
+              int *buf, int bufsize, int depth) {
+ #define STACK_SIZE SS_SMERGE_STACKSIZE
+ #define GETIDX(a) ((0 <= (a)) ? (a) : (~(a)))
+ #define MERGE_CHECK(a, b, c)\
+   do {\
+     if(((c) & 1) ||\
+        (((c) & 2) && (ss_compare(T, PA + GETIDX(*((a) - 1)), PA + *(a), depth) == 0))) {\
+       *(a) = ~*(a);\
+     }\
+     if(((c) & 4) && ((ss_compare(T, PA + GETIDX(*((b) - 1)), PA + *(b), depth) == 0))) {\
+       *(b) = ~*(b);\
+     }\
+   } while(0)
+   struct { int *a, *b, *c; int d; } stack[STACK_SIZE];
+   int *l, *r, *lm, *rm;
+   int m, len, half;
+   int ssize;
+   int check, next;
+ 
+   for(check = 0, ssize = 0;;) {
+     if((last - middle) <= bufsize) {
+       if((first < middle) && (middle < last)) {
+         ss_mergebackward(T, PA, first, middle, last, buf, depth);
+       }
+       MERGE_CHECK(first, last, check);
+       STACK_POP(first, middle, last, check);
+       continue;
+     }
+ 
+     if((middle - first) <= bufsize) {
+       if(first < middle) {
+         ss_mergeforward(T, PA, first, middle, last, buf, depth);
+       }
+       MERGE_CHECK(first, last, check);
+       STACK_POP(first, middle, last, check);
+       continue;
+     }
+ 
+     for(m = 0, len = MIN(middle - first, last - middle), half = len >> 1;
+         0 < len;
+         len = half, half >>= 1) {
+       if(ss_compare(T, PA + GETIDX(*(middle + m + half)),
+                        PA + GETIDX(*(middle - m - half - 1)), depth) < 0) {
+         m += half + 1;
+         half -= (len & 1) ^ 1;
+       }
+     }
+ 
+     if(0 < m) {
+       lm = middle - m, rm = middle + m;
+       ss_blockswap(lm, middle, m);
+       l = r = middle, next = 0;
+       if(rm < last) {
+         if(*rm < 0) {
+           *rm = ~*rm;
+           if(first < lm) { for(; *--l < 0;) { } next |= 4; }
+           next |= 1;
+         } else if(first < lm) {
+           for(; *r < 0; ++r) { }
+           next |= 2;
+         }
+       }
+ 
+       if((l - first) <= (last - r)) {
+         STACK_PUSH(r, rm, last, (next & 3) | (check & 4));
+         middle = lm, last = l, check = (check & 3) | (next & 4);
+       } else {
+         if((next & 2) && (r == middle)) { next ^= 6; }
+         STACK_PUSH(first, lm, l, (check & 3) | (next & 4));
+         first = r, middle = rm, check = (next & 3) | (check & 4);
+       }
+     } else {
+       if(ss_compare(T, PA + GETIDX(*(middle - 1)), PA + *middle, depth) == 0) {
+         *middle = ~*middle;
+       }
+       MERGE_CHECK(first, last, check);
+       STACK_POP(first, middle, last, check);
+     }
+   }
+ #undef STACK_SIZE
+ }
+ 
+ #endif /* SS_BLOCKSIZE != 0 */
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ 
+ /* Substring sort
+  *
+  * Sorts the indices in [first, last) by the substrings they designate in PA,
+  * comparing from byte offset `depth`.
+  *
+  * With SS_BLOCKSIZE == 0 the whole range is handed to ss_mintrosort.
+  * Otherwise the range is sorted in chunks of SS_BLOCKSIZE entries
+  * (ss_mintrosort, or ss_insertionsort for small block sizes) and the sorted
+  * chunks are combined pairwise with ss_swapmerge, using (buf, bufsize) or
+  * the not-yet-sorted remainder of the range as scratch space.
+  * If the supplied buffer is smaller than SS_BLOCKSIZE, than the range and
+  * than ss_isqrt of the range length, the last `limit` entries of the range
+  * itself are used as the buffer instead; that tail is then sorted
+  * separately and joined with ss_inplacemerge.
+  *
+  * When lastsuffix is non-zero, the first entry is excluded from the sort
+  * and inserted afterwards by a linear scan; for that comparison its
+  * substring is described by the temporary pair PAi = { PA[entry], n - 2 }.
+  */
+ static
+ void
+ sssort(const unsigned char *T, const int *PA,
+        int *first, int *last,
+        int *buf, int bufsize,
+        int depth, int n, int lastsuffix) {
+   int *a;
+ #if SS_BLOCKSIZE != 0
+   int *b, *middle, *curbuf;
+   int j, k, curbufsize, limit;
+ #endif
+   int i;
+ 
+   if(lastsuffix != 0) { ++first; }
+ 
+ #if SS_BLOCKSIZE == 0
+   ss_mintrosort(T, PA, first, last, depth);
+ #else
+   if((bufsize < SS_BLOCKSIZE) &&
+       (bufsize < (last - first)) &&
+       (bufsize < (limit = ss_isqrt(last - first)))) {
+     if(SS_BLOCKSIZE < limit) { limit = SS_BLOCKSIZE; }
+     buf = middle = last - limit, bufsize = limit; /* use the tail of the range as the merge buffer */
+   } else {
+     middle = last, limit = 0;
+   }
+   for(a = first, i = 0; SS_BLOCKSIZE < (middle - a); a += SS_BLOCKSIZE, ++i) {
+ #if SS_INSERTIONSORT_THRESHOLD < SS_BLOCKSIZE
+     ss_mintrosort(T, PA, a, a + SS_BLOCKSIZE, depth);
+ #elif 1 < SS_BLOCKSIZE
+     ss_insertionsort(T, PA, a, a + SS_BLOCKSIZE, depth);
+ #endif
+     curbufsize = last - (a + SS_BLOCKSIZE);
+     curbuf = a + SS_BLOCKSIZE;
+     if(curbufsize <= bufsize) { curbufsize = bufsize, curbuf = buf; }
+     for(b = a, k = SS_BLOCKSIZE, j = i; j & 1; b -= k, k <<= 1, j >>= 1) {
+       ss_swapmerge(T, PA, b - k, b, b + k, curbuf, curbufsize, depth);
+     }
+   }
+ #if SS_INSERTIONSORT_THRESHOLD < SS_BLOCKSIZE
+   ss_mintrosort(T, PA, a, middle, depth);
+ #elif 1 < SS_BLOCKSIZE
+   ss_insertionsort(T, PA, a, middle, depth);
+ #endif
+   for(k = SS_BLOCKSIZE; i != 0; k <<= 1, i >>= 1) {
+     if(i & 1) {
+       ss_swapmerge(T, PA, a - k, a, middle, buf, bufsize, depth);
+       a -= k;
+     }
+   }
+   if(limit != 0) {
+ #if SS_INSERTIONSORT_THRESHOLD < SS_BLOCKSIZE
+     ss_mintrosort(T, PA, middle, last, depth);
+ #elif 1 < SS_BLOCKSIZE
+     ss_insertionsort(T, PA, middle, last, depth);
+ #endif
+     ss_inplacemerge(T, PA, first, middle, last, depth);
+   }
+ #endif
+ 
+   if(lastsuffix != 0) {
+     /* Insert last type B* suffix. */
+     int PAi[2]; PAi[0] = PA[*(first - 1)], PAi[1] = n - 2;
+     for(a = first, i = *(first - 1);
+         (a < last) && ((*a < 0) || (0 < ss_compare(T, &(PAi[0]), PA + *a, depth)));
+         ++a) {
+       *(a - 1) = *a;
+     }
+     *(a - 1) = i;
+   }
+ }
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ /* Integer base-2 logarithm of n over all 32 bits: the position of the
+  * highest set bit, obtained from lg_table on the highest non-zero byte.
+  * Returns -1 for n == 0.
+  */
+ static INLINE
+ int
+ tr_ilg(int n) {
+   return (n & 0xffff0000) ?
+           ((n & 0xff000000) ?
+             24 + lg_table[(n >> 24) & 0xff] :
+             16 + lg_table[(n >> 16) & 0xff]) :
+           ((n & 0x0000ff00) ?
+              8 + lg_table[(n >>  8) & 0xff] :
+              0 + lg_table[(n >>  0) & 0xff]);
+ }
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ 
+ /* Simple insertionsort for small size groups.
+  *
+  * Sorts the suffix indexes stored in [first, last) by their key
+  * ISAd[index]. When the inserted element's key equals the key of the entry
+  * it lands directly after, that preceding entry is replaced by its bitwise
+  * complement (a negative value) to record the tie. Negative entries that
+  * sit directly before a shifted entry are shifted together with it and are
+  * skipped when looking for the next entry to compare against. */
+ static
+ void
+ tr_insertionsort(const int *ISAd, int *first, int *last) {
+   int *a, *b;
+   int t, r;
+ 
+   for(a = first + 1; a < last; ++a) {
+     for(t = *a, b = a - 1; 0 > (r = ISAd[t] - ISAd[*b]);) { /* t sorts before *b */
+       do { *(b + 1) = *b; } while((first <= --b) && (*b < 0)); /* shift *b and the negative entries before it */
+       if(b < first) { break; } /* ran off the front: t is the new minimum */
+     }
+     if(r == 0) { *b = ~*b; } /* equal keys: mark the predecessor as tied */
+     *(b + 1) = t;
+   }
+ }
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ /* Sifts the entry at heap position i down a max-heap stored in SA[0..size),
+  * ordered by the key ISAd[SA[x]].
+  * The right child SA[j] is read without comparing j against size, so the
+  * caller has to make sure that slot is readable. */
+ static INLINE
+ void
+ tr_fixdown(const int *ISAd, int *SA, int i, int size) {
+   int j, k;
+   int v;
+   int c, d, e;
+ 
+   for(v = SA[i], c = ISAd[v]; (j = 2 * i + 1) < size; SA[i] = SA[k], i = k) {
+     d = ISAd[SA[k = j++]]; /* k = left child; j now names the right child */
+     if(d < (e = ISAd[SA[j]])) { k = j; d = e; } /* continue with the larger child */
+     if(d <= c) { break; } /* neither child exceeds v: v belongs at i */
+   }
+   SA[i] = v;
+ }
+ 
+ /* Simple top-down heapsort.
+  *
+  * Reorders SA[0..size) into ascending order of the key ISAd[SA[x]].
+  * The max-heap is always built over an odd number of entries (m): for an
+  * even size the last entry is first ordered against SA[m / 2] and then
+  * exchanged with the heap maximum once the heap has been built.
+  * SWAP is a macro defined outside this block. */
+ static
+ void
+ tr_heapsort(const int *ISAd, int *SA, int size) {
+   int i, m;
+   int t;
+ 
+   m = size;
+   if((size % 2) == 0) {
+     m--;
+     if(ISAd[SA[m / 2]] < ISAd[SA[m]]) { SWAP(SA[m], SA[m / 2]); }
+   }
+ 
+   for(i = m / 2 - 1; 0 <= i; --i) { tr_fixdown(ISAd, SA, i, m); } /* build the heap bottom-up */
+   if((size % 2) == 0) { SWAP(SA[0], SA[m]); tr_fixdown(ISAd, SA, 0, m); }
+   for(i = m - 1; 0 < i; --i) { /* repeatedly move the current maximum to slot i */
+     t = SA[0], SA[0] = SA[i];
+     tr_fixdown(ISAd, SA, 0, i);
+     SA[i] = t;
+   }
+ }
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ 
+ /* Returns the median of three elements.
+  *
+  * v1, v2 and v3 point at suffix indexes; the comparison key of each is
+  * ISAd[*v]. The result is whichever of the three pointers refers to the
+  * middle key. SWAP is applied to the local pointer copies only.
+  * NOTE(review): t is not referenced directly; presumably the SWAP macro
+  * (defined outside this block) uses it as scratch -- confirm. */
+ static INLINE
+ int *
+ tr_median3(const int *ISAd, int *v1, int *v2, int *v3) {
+   int *t;
+   if(ISAd[*v1] > ISAd[*v2]) { SWAP(v1, v2); } /* now key(v1) <= key(v2) */
+   if(ISAd[*v2] > ISAd[*v3]) {
+     if(ISAd[*v1] > ISAd[*v3]) { return v1; }
+     else { return v3; }
+   }
+   return v2;
+ }
+ 
+ /* Returns the median of five elements.
+  *
+  * v1..v5 point at suffix indexes; the comparison key of each is ISAd[*v].
+  * The pointers are reordered locally with SWAP and either v3 or v4 is
+  * returned, depending on the final comparison.
+  * NOTE(review): t is not referenced directly; presumably the SWAP macro
+  * (defined outside this block) uses it as scratch -- confirm. */
+ static INLINE
+ int *
+ tr_median5(const int *ISAd,
+            int *v1, int *v2, int *v3, int *v4, int *v5) {
+   int *t;
+   if(ISAd[*v2] > ISAd[*v3]) { SWAP(v2, v3); }
+   if(ISAd[*v4] > ISAd[*v5]) { SWAP(v4, v5); }
+   if(ISAd[*v2] > ISAd[*v4]) { SWAP(v2, v4); SWAP(v3, v5); }
+   if(ISAd[*v1] > ISAd[*v3]) { SWAP(v1, v3); }
+   if(ISAd[*v1] > ISAd[*v4]) { SWAP(v1, v4); SWAP(v3, v5); }
+   if(ISAd[*v3] > ISAd[*v4]) { return v4; }
+   return v3;
+ }
+ 
+ /* Picks the pivot for the range [first, last).
+  * Up to 32 elements: median of first, centre and last element.
+  * Up to 512 elements: median of five evenly spread elements.
+  * Larger ranges: median of three medians-of-three taken from the front,
+  * the centre and the back of the range. */
+ static INLINE
+ int *
+ tr_pivot(const int *ISAd, int *first, int *last) {
+   int *center, *tail;
+   int *lo, *mid, *hi;
+   int len, step;
+ 
+   len = last - first;
+   center = first + len / 2;
+   tail = last - 1;
+ 
+   if(len <= 32) {
+     return tr_median3(ISAd, first, center, tail);
+   }
+   if(len <= 512) {
+     step = len >> 2;
+     return tr_median5(ISAd, first, first + step, center, tail - step, tail);
+   }
+ 
+   step = len >> 3;
+   lo  = tr_median3(ISAd, first, first + step, first + (step << 1));
+   mid = tr_median3(ISAd, center - step, center, center + step);
+   hi  = tr_median3(ISAd, tail - (step << 1), tail - step, tail);
+   return tr_median3(ISAd, lo, mid, hi);
+ }
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ 
+ typedef struct _trbudget_t trbudget_t; /* work budget consulted by trbudget_check */
+ struct _trbudget_t {
+   int chance; /* how many more times remain may be topped up by incval */
+   int remain; /* budget still available before a top-up is needed */
+   int incval; /* amount added to remain on each top-up */
+   int count; /* running total of the sizes that trbudget_check refused */
+ };
+ 
+ /* Sets up a budget with `chance` top-ups of `incval` each; the initial
+  * remaining budget is also `incval`. The count field is not touched here. */
+ static INLINE
+ void
+ trbudget_init(trbudget_t *budget, int chance, int incval) {
+   budget->incval = incval;
+   budget->remain = incval;
+   budget->chance = chance;
+ }
+ 
+ /* Tries to charge `size` units to the budget.
+  * Returns 1 when the charge was accepted (using one top-up if the remaining
+  * budget was too small), or 0 when it was refused because no top-up is
+  * left; a refused size is added to budget->count. */
+ static INLINE
+ int
+ trbudget_check(trbudget_t *budget, int size) {
+   int granted = 1;
+ 
+   if(budget->remain >= size) {
+     /* Enough budget left: just pay. */
+     budget->remain -= size;
+   } else if(budget->chance != 0) {
+     /* Spend one top-up and pay from the refilled budget. */
+     budget->remain += budget->incval - size;
+     budget->chance -= 1;
+   } else {
+     /* Out of top-ups: record the refused work. */
+     budget->count += size;
+     granted = 0;
+   }
+   return granted;
+ }
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ /* Three-way partition of [first, last) around the key value v, where the key
+  * of an entry p is ISAd[*p].
+  * Scanning starts at middle; entries in [first, middle) are not examined and
+  * are treated as having key v. Entries equal to v are first collected at
+  * both ends of the range and then swapped into the centre.
+  * On return [first, *pa) holds keys below v, [*pa, *pb) keys equal to v and
+  * [*pb, last) keys above v. If every examined key equals v, *pa == first
+  * and *pb == last. SWAP is a macro defined outside this block. */
+ static INLINE
+ void
+ tr_partition(const int *ISAd,
+              int *first, int *middle, int *last,
+              int **pa, int **pb, int v) {
+   int *a, *b, *c, *d, *e, *f;
+   int t, s;
+   int x = 0;
+ 
+   for(b = middle - 1; (++b < last) && ((x = ISAd[*b]) == v);) { } /* skip the leading run of keys equal to v */
+   if(((a = b) < last) && (x < v)) {
+     for(; (++b < last) && ((x = ISAd[*b]) <= v);) {
+       if(x == v) { SWAP(*b, *a); ++a; } /* park equal keys at the left end */
+     }
+   }
+   for(c = last; (b < --c) && ((x = ISAd[*c]) == v);) { } /* skip the trailing run of keys equal to v */
+   if((b < (d = c)) && (x > v)) {
+     for(; (b < --c) && ((x = ISAd[*c]) >= v);) {
+       if(x == v) { SWAP(*c, *d); --d; } /* park equal keys at the right end */
+     }
+   }
+   for(; b < c;) {
+     SWAP(*b, *c);
+     for(; (++b < c) && ((x = ISAd[*b]) <= v);) {
+       if(x == v) { SWAP(*b, *a); ++a; }
+     }
+     for(; (b < --c) && ((x = ISAd[*c]) >= v);) {
+       if(x == v) { SWAP(*c, *d); --d; }
+     }
+   }
+ 
+   if(a <= d) {
+     c = b - 1;
+     if((s = a - first) > (t = b - a)) { s = t; }
+     for(e = first, f = b - s; 0 < s; --s, ++e, ++f) { SWAP(*e, *f); } /* move the left equal block behind the smaller keys */
+     if((s = d - c) > (t = last - d - 1)) { s = t; }
+     for(e = b, f = last - s; 0 < s; --s, ++e, ++f) { SWAP(*e, *f); } /* move the right equal block in front of the larger keys */
+     first += (b - a), last -= (d - c);
+   }
+   *pa = first, *pb = last;
+ }
+ 
+ static
+ void
+ tr_copy(int *ISA, const int *SA,
+         int *first, int *a, int *b, int *last,
+         int depth) {
+   /* sort suffixes of middle partition
+      by using sorted order of suffixes of left and right partition.
+ 
+      [first, a) is the left partition, [a, b) the middle one and [b, last)
+      the right one. A suffix s is taken to belong to the middle partition
+      when ISA[s] == v. The first loop walks forward from first (including
+      the entries it appends itself) and places each qualifying predecessor
+      s = *c - depth right behind d; the second loop walks backward from
+      last - 1 and fills the remaining middle slots downward from b. Every
+      placed suffix gets its slot index in SA as its new rank. */
+   int *c, *d, *e;
+   int s, v;
+ 
+   v = b - SA - 1; /* rank currently shared by the middle partition */
+   for(c = first, d = a - 1; c <= d; ++c) {
+     if((0 <= (s = *c - depth)) && (ISA[s] == v)) {
+       *++d = s;
+       ISA[s] = d - SA;
+     }
+   }
+   for(c = last - 1, e = d + 1, d = b; e < d; --c) {
+     if((0 <= (s = *c - depth)) && (ISA[s] == v)) {
+       *--d = s;
+       ISA[s] = d - SA;
+     }
+   }
+ }
+ /* Variant of tr_copy that hands out shared ranks instead of unique ones.
+  * Suffixes of the middle partition [a, b) (those with ISA[s] == v) are placed
+  * by scanning the left partition forward and the right partition backward,
+  * as in tr_copy, but a new rank is started only when ISA[s + depth] differs
+  * from the value seen for the previously placed suffix.
+  * Between the two scans the entries in [first, d] are walked backward and
+  * each run of equal ranks is renumbered to the slot index at which the run
+  * is first met in that backward walk. */
+ static
+ void
+ tr_partialcopy(int *ISA, const int *SA,
+                int *first, int *a, int *b, int *last,
+                int depth) {
+   int *c, *d, *e;
+   int s, v;
+   int rank, lastrank, newrank = -1;
+ 
+   v = b - SA - 1; /* rank currently shared by the middle partition */
+   lastrank = -1;
+   for(c = first, d = a - 1; c <= d; ++c) {
+     if((0 <= (s = *c - depth)) && (ISA[s] == v)) {
+       *++d = s;
+       rank = ISA[s + depth];
+       if(lastrank != rank) { lastrank = rank; newrank = d - SA; }
+       ISA[s] = newrank;
+     }
+   }
+ 
+   lastrank = -1;
+   for(e = d; first <= e; --e) {
+     rank = ISA[*e];
+     if(lastrank != rank) { lastrank = rank; newrank = e - SA; }
+     if(newrank != rank) { ISA[*e] = newrank; }
+   }
+ 
+   lastrank = -1;
+   for(c = last - 1, e = d + 1, d = b; e < d; --c) {
+     if((0 <= (s = *c - depth)) && (ISA[s] == v)) {
+       *--d = s;
+       rank = ISA[s + depth];
+       if(lastrank != rank) { lastrank = rank; newrank = d - SA; }
+       ISA[s] = newrank;
+     }
+   }
+ }
+ /* Iterative introsort over the group [first, last) of SA, keyed by
+  * ISAd[SA[x]], driven by an explicit stack instead of recursion.
+  *
+  * limit doubles as a state code. A non-negative value is the remaining
+  * quicksort depth (seeded from tr_ilg of the range size; heapsort takes over
+  * when it reaches zero). -1 requests a tandem repeat partition, -2 a tandem
+  * repeat copy and -3 the post-processing of an already sorted partition.
+  * trbudget_check decides whether a subgroup of equal keys is refined further
+  * at the next depth (ISAd + incr) or left as it is for now.
+  * STACK_PUSH5, STACK_POP5 and SWAP are macros defined outside this block;
+  * presumably STACK_POP5 returns from the function once the stack is
+  * empty -- confirm against the macro definition. */
+ static
+ void
+ tr_introsort(int *ISA, const int *ISAd,
+              int *SA, int *first, int *last,
+              trbudget_t *budget) {
+ #define STACK_SIZE TR_STACKSIZE
+   struct { const int *a; int *b, *c; int d, e; }stack[STACK_SIZE];
+   int *a, *b, *c;
+   int t;
+   int v, x = 0;
+   int incr = ISAd - ISA; /* offset of the key array from ISA; also the step to the next depth */
+   int limit, next;
+   int ssize, trlink = -1;
+ 
+   for(ssize = 0, limit = tr_ilg(last - first);;) {
+ 
+     if(limit < 0) { /* negative limit is a state code, not a depth */
+       if(limit == -1) {
+         /* tandem repeat partition */
+         tr_partition(ISAd - incr, first, first, last, &a, &b, last - SA - 1);
+ 
+         /* update ranks */
+         if(a < last) {
+           for(c = first, v = a - SA - 1; c < a; ++c) { ISA[*c] = v; }
+         }
+         if(b < last) {
+           for(c = a, v = b - SA - 1; c < b; ++c) { ISA[*c] = v; }
+         }
+ 
+         /* push */
+         if(1 < (b - a)) {
+           STACK_PUSH5(NULL, a, b, 0, 0);
+           STACK_PUSH5(ISAd - incr, first, last, -2, trlink);
+           trlink = ssize - 2;
+         }
+         if((a - first) <= (last - b)) {
+           if(1 < (a - first)) {
+             STACK_PUSH5(ISAd, b, last, tr_ilg(last - b), trlink);
+             last = a, limit = tr_ilg(a - first);
+           } else if(1 < (last - b)) {
+             first = b, limit = tr_ilg(last - b);
+           } else {
+             STACK_POP5(ISAd, first, last, limit, trlink);
+           }
+         } else {
+           if(1 < (last - b)) {
+             STACK_PUSH5(ISAd, first, a, tr_ilg(a - first), trlink);
+             first = b, limit = tr_ilg(last - b);
+           } else if(1 < (a - first)) {
+             last = a, limit = tr_ilg(a - first);
+           } else {
+             STACK_POP5(ISAd, first, last, limit, trlink);
+           }
+         }
+       } else if(limit == -2) {
+         /* tandem repeat copy */
+         a = stack[--ssize].b, b = stack[ssize].c;
+         if(stack[ssize].d == 0) { /* entry was never flagged: the plain copy is used */
+           tr_copy(ISA, SA, first, a, b, last, ISAd - ISA);
+         } else {
+           if(0 <= trlink) { stack[trlink].d = -1; }
+           tr_partialcopy(ISA, SA, first, a, b, last, ISAd - ISA);
+         }
+         STACK_POP5(ISAd, first, last, limit, trlink);
+       } else {
+         /* sorted partition */
+         if(0 <= *first) {
+           a = first;
+           do { ISA[*a] = a - SA; } while((++a < last) && (0 <= *a));
+           first = a;
+         }
+         if(first < last) {
+           a = first; do { *a = ~*a; } while(*++a < 0); /* undo the complement marks of this run */
+           next = (ISA[*a] != ISAd[*a]) ? tr_ilg(a - first + 1) : -1;
+           if(++a < last) { for(b = first, v = a - SA - 1; b < a; ++b) { ISA[*b] = v; } }
+ 
+           /* push */
+           if(trbudget_check(budget, a - first)) {
+             if((a - first) <= (last - a)) {
+               STACK_PUSH5(ISAd, a, last, -3, trlink);
+               ISAd += incr, last = a, limit = next;
+             } else {
+               if(1 < (last - a)) {
+                 STACK_PUSH5(ISAd + incr, first, a, next, trlink);
+                 first = a, limit = -3;
+               } else {
+                 ISAd += incr, last = a, limit = next;
+               }
+             }
+           } else {
+             if(0 <= trlink) { stack[trlink].d = -1; } /* flag the linked entry so its copy step uses tr_partialcopy */
+             if(1 < (last - a)) {
+               first = a, limit = -3;
+             } else {
+               STACK_POP5(ISAd, first, last, limit, trlink);
+             }
+           }
+         } else {
+           STACK_POP5(ISAd, first, last, limit, trlink);
+         }
+       }
+       continue;
+     }
+ 
+     if((last - first) <= TR_INSERTIONSORT_THRESHOLD) { /* small group: insertion sort, then post-process */
+       tr_insertionsort(ISAd, first, last);
+       limit = -3;
+       continue;
+     }
+ 
+     if(limit-- == 0) { /* depth budget used up: fall back to heapsort */
+       tr_heapsort(ISAd, first, last - first);
+       for(a = last - 1; first < a; a = b) {
+         for(x = ISAd[*a], b = a - 1; (first <= b) && (ISAd[*b] == x); --b) { *b = ~*b; } /* complement all but the last entry of each run of equal keys */
+       }
+       limit = -3;
+       continue;
+     }
+ 
+     /* choose pivot */
+     a = tr_pivot(ISAd, first, last);
+     SWAP(*first, *a);
+     v = ISAd[*first];
+ 
+     /* partition */
+     tr_partition(ISAd, first, first + 1, last, &a, &b, v);
+     if((last - first) != (b - a)) { /* at least one key differs from the pivot key */
+       next = (ISA[*a] != v) ? tr_ilg(b - a) : -1;
+ 
+       /* update ranks */
+       for(c = first, v = a - SA - 1; c < a; ++c) { ISA[*c] = v; }
+       if(b < last) { for(c = a, v = b - SA - 1; c < b; ++c) { ISA[*c] = v; } }
+ 
+       /* push */
+       if((1 < (b - a)) && (trbudget_check(budget, b - a))) {
+         if((a - first) <= (last - b)) {
+           if((last - b) <= (b - a)) {
+             if(1 < (a - first)) {
+               STACK_PUSH5(ISAd + incr, a, b, next, trlink);
+               STACK_PUSH5(ISAd, b, last, limit, trlink);
+               last = a;
+             } else if(1 < (last - b)) {
+               STACK_PUSH5(ISAd + incr, a, b, next, trlink);
+               first = b;
+             } else {
+               ISAd += incr, first = a, last = b, limit = next;
+             }
+           } else if((a - first) <= (b - a)) {
+             if(1 < (a - first)) {
+               STACK_PUSH5(ISAd, b, last, limit, trlink);
+               STACK_PUSH5(ISAd + incr, a, b, next, trlink);
+               last = a;
+             } else {
+               STACK_PUSH5(ISAd, b, last, limit, trlink);
+               ISAd += incr, first = a, last = b, limit = next;
+             }
+           } else {
+             STACK_PUSH5(ISAd, b, last, limit, trlink);
+             STACK_PUSH5(ISAd, first, a, limit, trlink);
+             ISAd += incr, first = a, last = b, limit = next;
+           }
+         } else {
+           if((a - first) <= (b - a)) {
+             if(1 < (last - b)) {
+               STACK_PUSH5(ISAd + incr, a, b, next, trlink);
+               STACK_PUSH5(ISAd, first, a, limit, trlink);
+               first = b;
+             } else if(1 < (a - first)) {
+               STACK_PUSH5(ISAd + incr, a, b, next, trlink);
+               last = a;
+             } else {
+               ISAd += incr, first = a, last = b, limit = next;
+             }
+           } else if((last - b) <= (b - a)) {
+             if(1 < (last - b)) {
+               STACK_PUSH5(ISAd, first, a, limit, trlink);
+               STACK_PUSH5(ISAd + incr, a, b, next, trlink);
+               first = b;
+             } else {
+               STACK_PUSH5(ISAd, first, a, limit, trlink);
+               ISAd += incr, first = a, last = b, limit = next;
+             }
+           } else {
+             STACK_PUSH5(ISAd, first, a, limit, trlink);
+             STACK_PUSH5(ISAd, b, last, limit, trlink);
+             ISAd += incr, first = a, last = b, limit = next;
+           }
+         }
+       } else {
+         if((1 < (b - a)) && (0 <= trlink)) { stack[trlink].d = -1; }
+         if((a - first) <= (last - b)) {
+           if(1 < (a - first)) {
+             STACK_PUSH5(ISAd, b, last, limit, trlink);
+             last = a;
+           } else if(1 < (last - b)) {
+             first = b;
+           } else {
+             STACK_POP5(ISAd, first, last, limit, trlink);
+           }
+         } else {
+           if(1 < (last - b)) {
+             STACK_PUSH5(ISAd, first, a, limit, trlink);
+             first = b;
+           } else if(1 < (a - first)) {
+             last = a;
+           } else {
+             STACK_POP5(ISAd, first, last, limit, trlink);
+           }
+         }
+       }
+     } else { /* every key in the range equals the pivot key */
+       if(trbudget_check(budget, last - first)) {
+         limit = tr_ilg(last - first), ISAd += incr;
+       } else {
+         if(0 <= trlink) { stack[trlink].d = -1; }
+         STACK_POP5(ISAd, first, last, limit, trlink);
+       }
+     }
+   }
+ #undef STACK_SIZE
+ }
+ 
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ 
+ /* Tandem repeat sort
+  *
+  * Repeatedly refines the groups recorded in SA[0..n) / ISA with
+  * tr_introsort. Each pass uses ISAd = ISA + (current depth) as the key array
+  * and the depth doubles after every pass (ISAd += ISAd - ISA).
+  * While walking SA, a negative entry -k means "skip k positions"; a
+  * non-negative entry t starts a group that ends at SA + ISA[t]. Lengths of
+  * adjacent finished stretches are accumulated in skip and written back as
+  * one negative entry at the start of the stretch.
+  * The loop ends when a pass leaves nothing unsorted (budget.count stayed 0
+  * for every group) or when SA[0] is -n or lower. */
+ static
+ void
+ trsort(int *ISA, int *SA, int n, int depth) {
+   int *ISAd;
+   int *first, *last;
+   trbudget_t budget;
+   int t, skip, unsorted;
+ 
+   trbudget_init(&budget, tr_ilg(n) * 2 / 3, n);
+ /*  trbudget_init(&budget, tr_ilg(n) * 3 / 4, n); */
+   for(ISAd = ISA + depth; -n < *SA; ISAd += ISAd - ISA) {
+     first = SA;
+     skip = 0;
+     unsorted = 0;
+     do {
+       if((t = *first) < 0) { first -= t; skip += t; } /* jump over a finished stretch */
+       else {
+         if(skip != 0) { *(first + skip) = skip; skip = 0; } /* store the merged stretch length at its start */
+         last = SA + ISA[t] + 1;
+         if(1 < (last - first)) {
+           budget.count = 0; /* trbudget_init leaves count unset; reset it per group */
+           tr_introsort(ISA, ISAd, SA, first, last, &budget);
+           if(budget.count != 0) { unsorted += budget.count; }
+           else { skip = first - last; }
+         } else if((last - first) == 1) {
+           skip = -1;
+         }
+         first = last;
+       }
+     } while(first < (SA + n));
+     if(skip != 0) { *(first + skip) = skip; }
+     if(unsorted == 0) { break; }
+   }
+ }
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ 
+ /* Sorts suffixes of type B*.
+  *
+  * Counts the type A, B and B* suffixes of T[0..n) into bucket_A and
+  * bucket_B, collects the positions of the B* suffixes at the end of SA,
+  * sorts them (sssort on the substrings, then trsort on the ranks) and
+  * finally moves them to their bucket positions inside SA.
+  * Returns m, the number of type B* suffixes.
+  * openMP is only consulted when LIBBSC_OPENMP is defined.
+  * BUCKET_A, BUCKET_B and BUCKET_BSTAR are accessor macros defined outside
+  * this block. */
+ static
+ int
+ sort_typeBstar(const unsigned char *T, int *SA,
+                int *bucket_A, int *bucket_B,
+                int n, int openMP) {
+   int *PAb, *ISAb, *buf;
+ #ifdef LIBBSC_OPENMP
+   int *curbuf;
+   int l;
+ #endif
+   int i, j, k, t, m, bufsize;
+   int c0, c1;
+ #ifdef LIBBSC_OPENMP
+   int d0, d1;
+ #endif
+   (void)openMP; /* keeps the parameter referenced when LIBBSC_OPENMP is not defined */
+ 
+   /* Initialize bucket arrays. */
+   for(i = 0; i < BUCKET_A_SIZE; ++i) { bucket_A[i] = 0; }
+   for(i = 0; i < BUCKET_B_SIZE; ++i) { bucket_B[i] = 0; }
+ 
+   /* Count the number of occurrences of the first one or two characters of each
+      type A, B and B* suffix. Moreover, store the beginning position of all
+      type B* suffixes into the array SA. */
+   for(i = n - 1, m = n, c0 = T[n - 1]; 0 <= i;) {
+     /* type A suffix. */
+     do { ++BUCKET_A(c1 = c0); } while((0 <= --i) && ((c0 = T[i]) >= c1));
+     if(0 <= i) {
+       /* type B* suffix. */
+       ++BUCKET_BSTAR(c0, c1);
+       SA[--m] = i;
+       /* type B suffix. */
+       for(--i, c1 = c0; (0 <= i) && ((c0 = T[i]) <= c1); --i, c1 = c0) {
+         ++BUCKET_B(c0, c1);
+       }
+     }
+   }
+   m = n - m; /* m now counts the type B* suffixes stored in SA[n - m .. n) */
+ /*
+ note:
+   A type B* suffix is lexicographically smaller than a type B suffix that
+   begins with the same first two characters.
+ */
+ 
+   /* Calculate the index of start/end point of each bucket. */
+   for(c0 = 0, i = 0, j = 0; c0 < ALPHABET_SIZE; ++c0) {
+     t = i + BUCKET_A(c0);
+     BUCKET_A(c0) = i + j; /* start point */
+     i = t + BUCKET_B(c0, c0);
+     for(c1 = c0 + 1; c1 < ALPHABET_SIZE; ++c1) {
+       j += BUCKET_BSTAR(c0, c1);
+       BUCKET_BSTAR(c0, c1) = j; /* end point */
+       i += BUCKET_B(c0, c1);
+     }
+   }
+ 
+   if(0 < m) {
+     /* Sort the type B* suffixes by their first two characters. */
+     PAb = SA + n - m; ISAb = SA + m;
+     for(i = m - 2; 0 <= i; --i) {
+       t = PAb[i], c0 = T[t], c1 = T[t + 1];
+       SA[--BUCKET_BSTAR(c0, c1)] = i;
+     }
+     t = PAb[m - 1], c0 = T[t], c1 = T[t + 1];
+     SA[--BUCKET_BSTAR(c0, c1)] = m - 1;
+ 
+     /* Sort the type B* substrings using sssort. */
+ #ifdef LIBBSC_OPENMP
+     if (openMP)
+     {
+         buf = SA + m;
+         c0 = ALPHABET_SIZE - 2, c1 = ALPHABET_SIZE - 1, j = m;
+ #pragma omp parallel default(shared) private(bufsize, curbuf, k, l, d0, d1)
+         {
+           bufsize = (n - (2 * m)) / omp_get_num_threads();
+           curbuf = buf + omp_get_thread_num() * bufsize;
+           k = 0;
+           for(;;) {
+             #pragma omp critical(sssort_lock)
+             {
+               if(0 < (l = j)) {
+                 d0 = c0, d1 = c1;
+                 do {
+                   k = BUCKET_BSTAR(d0, d1);
+                   if(--d1 <= d0) {
+                     d1 = ALPHABET_SIZE - 1;
+                     if(--d0 < 0) { break; }
+                   }
+                 } while(((l - k) <= 1) && (0 < (l = k)));
+                 c0 = d0, c1 = d1, j = k;
+               }
+             }
+             if(l == 0) { break; }
+             sssort(T, PAb, SA + k, SA + l,
+                    curbuf, bufsize, 2, n, *(SA + k) == (m - 1));
+           }
+         }
+     }
+     else
+     {
+         buf = SA + m, bufsize = n - (2 * m);
+         for(c0 = ALPHABET_SIZE - 2, j = m; 0 < j; --c0) {
+           for(c1 = ALPHABET_SIZE - 1; c0 < c1; j = i, --c1) {
+             i = BUCKET_BSTAR(c0, c1);
+             if(1 < (j - i)) {
+               sssort(T, PAb, SA + i, SA + j,
+                      buf, bufsize, 2, n, *(SA + i) == (m - 1));
+             }
+           }
+         }
+     }
+ #else
+     buf = SA + m, bufsize = n - (2 * m);
+     for(c0 = ALPHABET_SIZE - 2, j = m; 0 < j; --c0) {
+       for(c1 = ALPHABET_SIZE - 1; c0 < c1; j = i, --c1) {
+         i = BUCKET_BSTAR(c0, c1);
+         if(1 < (j - i)) {
+           sssort(T, PAb, SA + i, SA + j,
+                  buf, bufsize, 2, n, *(SA + i) == (m - 1));
+         }
+       }
+     }
+ #endif
+ 
+     /* Compute ranks of type B* substrings. */
+     for(i = m - 1; 0 <= i; --i) {
+       if(0 <= SA[i]) {
+         j = i;
+         do { ISAb[SA[i]] = i; } while((0 <= --i) && (0 <= SA[i]));
+         SA[i + 1] = i - j;
+         if(i <= 0) { break; }
+       }
+       j = i;
+       do { ISAb[SA[i] = ~SA[i]] = j; } while(SA[--i] < 0);
+       ISAb[SA[i]] = j;
+     }
+ 
+     /* Construct the inverse suffix array of type B* suffixes using trsort. */
+     trsort(ISAb, SA, m, 1);
+ 
+     /* Set the sorted order of type B* suffixes. */
+     for(i = n - 1, j = m, c0 = T[n - 1]; 0 <= i;) {
+       for(--i, c1 = c0; (0 <= i) && ((c0 = T[i]) >= c1); --i, c1 = c0) { }
+       if(0 <= i) {
+         t = i;
+         for(--i, c1 = c0; (0 <= i) && ((c0 = T[i]) <= c1); --i, c1 = c0) { }
+         SA[ISAb[--j]] = ((t == 0) || (1 < (t - i))) ? t : ~t;
+       }
+     }
+ 
+     /* Calculate the index of start/end point of each bucket. */
+     BUCKET_B(ALPHABET_SIZE - 1, ALPHABET_SIZE - 1) = n; /* end point */
+     for(c0 = ALPHABET_SIZE - 2, k = m - 1; 0 <= c0; --c0) {
+       i = BUCKET_A(c0 + 1) - 1;
+       for(c1 = ALPHABET_SIZE - 1; c0 < c1; --c1) {
+         t = i - BUCKET_B(c0, c1);
+         BUCKET_B(c0, c1) = i; /* end point */
+ 
+         /* Move all type B* suffixes to the correct position. */
+         for(i = t, j = BUCKET_BSTAR(c0, c1);
+             j <= k;
+             --i, --k) { SA[i] = SA[k]; }
+       }
+       BUCKET_BSTAR(c0, c0 + 1) = i - BUCKET_B(c0, c0) + 1; /* start point */
+       BUCKET_B(c0, c0) = i; /* end point */
+     }
+   }
+ 
+   return m;
+ }
+ 
+ /* Constructs the suffix array by using the sorted order of type B* suffixes.
+  *
+  * The first scan (only when m > 0) walks each bucket right to left and
+  * places the type B suffixes; the second scan walks SA left to right and
+  * places the remaining suffixes through bucket_A. Entries are stored as
+  * bitwise complements while they must not be expanded and are flipped back
+  * when a scan reaches them.
+  * T[n - 2] is read unconditionally, so n must be at least 2.
+  * BUCKET_A, BUCKET_B and BUCKET_BSTAR are macros defined outside this
+  * block. */
+ static
+ void
+ construct_SA(const unsigned char *T, int *SA,
+              int *bucket_A, int *bucket_B,
+              int n, int m) {
+   int *i, *j, *k;
+   int s;
+   int c0, c1, c2;
+ 
+   if(0 < m) {
+     /* Construct the sorted order of type B suffixes by using
+        the sorted order of type B* suffixes. */
+     for(c1 = ALPHABET_SIZE - 2; 0 <= c1; --c1) {
+       /* Scan the suffix array from right to left. */
+       for(i = SA + BUCKET_BSTAR(c1, c1 + 1),
+           j = SA + BUCKET_A(c1 + 1) - 1, k = NULL, c2 = -1;
+           i <= j;
+           --j) {
+         if(0 < (s = *j)) {
+           assert(T[s] == c1);
+           assert(((s + 1) < n) && (T[s] <= T[s + 1]));
+           assert(T[s - 1] <= T[s]);
+           *j = ~s;
+           c0 = T[--s]; /* s now names the preceding suffix, c0 its first character */
+           if((0 < s) && (T[s - 1] > c0)) { s = ~s; }
+           if(c0 != c2) {
+             if(0 <= c2) { BUCKET_B(c2, c1) = k - SA; } /* save the write position of the bucket being left */
+             k = SA + BUCKET_B(c2 = c0, c1);
+           }
+           assert(k < j); assert(k != NULL);
+           *k-- = s;
+         } else {
+           assert(((s == 0) && (T[s] == c1)) || (s < 0));
+           *j = ~s;
+         }
+       }
+     }
+   }
+ 
+   /* Construct the suffix array by using
+      the sorted order of type B suffixes. */
+   k = SA + BUCKET_A(c2 = T[n - 1]);
+   *k++ = (T[n - 2] < c2) ? ~(n - 1) : (n - 1);
+   /* Scan the suffix array from left to right. */
+   for(i = SA, j = SA + n; i < j; ++i) {
+     if(0 < (s = *i)) {
+       assert(T[s - 1] >= T[s]);
+       c0 = T[--s];
+       if((s == 0) || (T[s - 1] < c0)) { s = ~s; }
+       if(c0 != c2) {
+         BUCKET_A(c2) = k - SA;
+         k = SA + BUCKET_A(c2 = c0);
+       }
+       assert(i < k);
+       *k++ = s;
+     } else {
+       assert(s < 0);
+       *i = ~s;
+     }
+   }
+ }
+ 
+ /* Constructs the burrows-wheeler transformed string directly
+    by using the sorted order of type B* suffixes.
+ 
+    Two scans are made: right to left over each bucket (only when m > 0) and
+    then left to right over all of SA. A slot that has been expanded is
+    overwritten with the character preceding its suffix instead of keeping
+    the suffix index; in the first scan that character is stored
+    complemented and is flipped back by the second scan.
+    Returns the offset in SA of the last slot found holding 0 during the
+    left-to-right scan, or 0 if no such slot was seen.
+    T[n - 2] is read unconditionally, so n must be at least 2. */
+ static
+ int
+ construct_BWT(const unsigned char *T, int *SA,
+               int *bucket_A, int *bucket_B,
+               int n, int m) {
+   int *i, *j, *k, *orig;
+   int s;
+   int c0, c1, c2;
+ 
+   if(0 < m) {
+     /* Construct the sorted order of type B suffixes by using
+        the sorted order of type B* suffixes. */
+     for(c1 = ALPHABET_SIZE - 2; 0 <= c1; --c1) {
+       /* Scan the suffix array from right to left. */
+       for(i = SA + BUCKET_BSTAR(c1, c1 + 1),
+           j = SA + BUCKET_A(c1 + 1) - 1, k = NULL, c2 = -1;
+           i <= j;
+           --j) {
+         if(0 < (s = *j)) {
+           assert(T[s] == c1);
+           assert(((s + 1) < n) && (T[s] <= T[s + 1]));
+           assert(T[s - 1] <= T[s]);
+           c0 = T[--s];
+           *j = ~((int)c0); /* keep the preceding character, complemented, in place of the index */
+           if((0 < s) && (T[s - 1] > c0)) { s = ~s; }
+           if(c0 != c2) {
+             if(0 <= c2) { BUCKET_B(c2, c1) = k - SA; }
+             k = SA + BUCKET_B(c2 = c0, c1);
+           }
+           assert(k < j); assert(k != NULL);
+           *k-- = s;
+         } else if(s != 0) {
+           *j = ~s;
+ #ifndef NDEBUG
+         } else {
+           assert(T[s] == c1);
+ #endif
+         }
+       }
+     }
+   }
+ 
+   /* Construct the BWTed string by using
+      the sorted order of type B suffixes. */
+   k = SA + BUCKET_A(c2 = T[n - 1]);
+   *k++ = (T[n - 2] < c2) ? ~((int)T[n - 2]) : (n - 1);
+   /* Scan the suffix array from left to right. */
+   for(i = SA, j = SA + n, orig = SA; i < j; ++i) {
+     if(0 < (s = *i)) {
+       assert(T[s - 1] >= T[s]);
+       c0 = T[--s];
+       *i = c0; /* output character for this slot */
+       if((0 < s) && (T[s - 1] < c0)) { s = ~((int)T[s - 1]); }
+       if(c0 != c2) {
+         BUCKET_A(c2) = k - SA;
+         k = SA + BUCKET_A(c2 = c0);
+       }
+       assert(i < k);
+       *k++ = s;
+     } else if(s != 0) {
+       *i = ~s;
+     } else {
+       orig = i; /* slot holding 0: remembered as the return value */
+     }
+   }
+ 
+   return orig - SA;
+ }
+ 
+ /* Constructs the burrows-wheeler transformed string directly
+    by using the sorted order of type B* suffixes.
+ 
+    Works like construct_BWT and additionally records secondary indexes.
+    mod is built from n / 8 by setting every bit below its highest set bit and
+    then shifting right once; *num_indexes is set to (n - 1) / (mod + 1).
+    For every suffix position s with (s & mod) == 0 that is visited, the SA
+    offset involved is stored in indexes[s / (mod + 1) - 1].
+    Returns the offset in SA of the last slot found holding 0 during the
+    left-to-right scan, or 0 if no such slot was seen.
+    T[n - 2] is read unconditionally, so n must be at least 2. */
+ static
+ int
+ construct_BWT_indexes(const unsigned char *T, int *SA,
+                       int *bucket_A, int *bucket_B,
+                       int n, int m,
+                       unsigned char * num_indexes, int * indexes) {
+   int *i, *j, *k, *orig;
+   int s;
+   int c0, c1, c2;
+ 
+   int mod = n / 8;
+   {
+       mod |= mod >> 1;  mod |= mod >> 2;
+       mod |= mod >> 4;  mod |= mod >> 8;
+       mod |= mod >> 16; mod >>= 1;
+ 
+       *num_indexes = (unsigned char)((n - 1) / (mod + 1));
+   }
+ 
+   if(0 < m) {
+     /* Construct the sorted order of type B suffixes by using
+        the sorted order of type B* suffixes. */
+     for(c1 = ALPHABET_SIZE - 2; 0 <= c1; --c1) {
+       /* Scan the suffix array from right to left. */
+       for(i = SA + BUCKET_BSTAR(c1, c1 + 1),
+           j = SA + BUCKET_A(c1 + 1) - 1, k = NULL, c2 = -1;
+           i <= j;
+           --j) {
+         if(0 < (s = *j)) {
+           assert(T[s] == c1);
+           assert(((s + 1) < n) && (T[s] <= T[s + 1]));
+           assert(T[s - 1] <= T[s]);
+ 
+           if ((s & mod) == 0) indexes[s / (mod + 1) - 1] = j - SA;
+ 
+           c0 = T[--s];
+           *j = ~((int)c0);
+           if((0 < s) && (T[s - 1] > c0)) { s = ~s; }
+           if(c0 != c2) {
+             if(0 <= c2) { BUCKET_B(c2, c1) = k - SA; }
+             k = SA + BUCKET_B(c2 = c0, c1);
+           }
+           assert(k < j); assert(k != NULL);
+           *k-- = s;
+         } else if(s != 0) {
+           *j = ~s;
+ #ifndef NDEBUG
+         } else {
+           assert(T[s] == c1);
+ #endif
+         }
+       }
+     }
+   }
+ 
+   /* Construct the BWTed string by using
+      the sorted order of type B suffixes. */
+   k = SA + BUCKET_A(c2 = T[n - 1]);
+   if (T[n - 2] < c2) {
+     if (((n - 1) & mod) == 0) indexes[(n - 1) / (mod + 1) - 1] = k - SA;
+     *k++ = ~((int)T[n - 2]);
+   }
+   else {
+     *k++ = n - 1;
+   }
+ 
+   /* Scan the suffix array from left to right. */
+   for(i = SA, j = SA + n, orig = SA; i < j; ++i) {
+     if(0 < (s = *i)) {
+       assert(T[s - 1] >= T[s]);
+ 
+       if ((s & mod) == 0) indexes[s / (mod + 1) - 1] = i - SA;
+ 
+       c0 = T[--s];
+       *i = c0;
+       if(c0 != c2) {
+         BUCKET_A(c2) = k - SA;
+         k = SA + BUCKET_A(c2 = c0);
+       }
+       assert(i < k);
+       if((0 < s) && (T[s - 1] < c0)) {
+           if ((s & mod) == 0) indexes[s / (mod + 1) - 1] = k - SA; /* this slot is stored as a character and will not be expanded, so record it now */
+           *k++ = ~((int)T[s - 1]);
+       } else
+         *k++ = s;
+     } else if(s != 0) {
+       *i = ~s;
+     } else {
+       orig = i;
+     }
+   }
+ 
+   return orig - SA;
+ }
+ 
+ 
+ /*---------------------------------------------------------------------------*/
+ 
+ /*- Function -*/
+ 
+ /* Builds the suffix array of T[0..n) into SA[0..n).
+  * Returns 0 on success, -1 when T or SA is NULL or n is negative, and -2
+  * when the bucket arrays cannot be allocated. Inputs of length 0, 1 and 2
+  * are answered directly without allocating anything. */
+ int
+ divsufsort(const unsigned char *T, int *SA, int n, int openMP) {
+   int *bucket_A, *bucket_B;
+   int m;
+   int err;
+ 
+   /* Check arguments. */
+   if((T == NULL) || (SA == NULL) || (n < 0)) { return -1; }
+   switch(n) {
+   case 0:
+     return 0;
+   case 1:
+     SA[0] = 0;
+     return 0;
+   case 2:
+     /* The smaller suffix goes first; on a tie suffix 1 precedes suffix 0. */
+     if(T[0] < T[1]) { SA[0] = 0; SA[1] = 1; }
+     else { SA[0] = 1; SA[1] = 0; }
+     return 0;
+   default:
+     break;
+   }
+ 
+   bucket_A = (int *)malloc(BUCKET_A_SIZE * sizeof(int));
+   bucket_B = (int *)malloc(BUCKET_B_SIZE * sizeof(int));
+ 
+   /* Suffixsort. */
+   if((bucket_A == NULL) || (bucket_B == NULL)) {
+     err = -2;
+   } else {
+     err = 0;
+     m = sort_typeBstar(T, SA, bucket_A, bucket_B, n, openMP);
+     construct_SA(T, SA, bucket_A, bucket_B, n, m);
+   }
+ 
+   /* free(NULL) is a no-op, so both paths share the cleanup. */
+   free(bucket_B);
+   free(bucket_A);
+ 
+   return err;
+ }
+ 
+ /* Computes the Burrows-Wheeler transform of T[0..n) into U[0..n).
+  * A is an optional work array; when it is NULL a temporary array of n + 1
+  * ints is allocated and released here. Secondary indexes are produced only
+  * when both num_indexes and indexes are non-NULL.
+  * Returns the primary index plus one on success, n itself for n <= 1, -1
+  * when T or U is NULL or n is negative, and -2 when an allocation fails. */
+ int
+ divbwt(const unsigned char *T, unsigned char *U, int *A, int n, unsigned char * num_indexes, int * indexes, int openMP) {
+   int *B;
+   int *bucket_A, *bucket_B;
+   int m, pidx, i;
+   int want_indexes;
+ 
+   /* Check arguments. */
+   if((T == NULL) || (U == NULL) || (n < 0)) { return -1; }
+   if(n <= 1) {
+     if(n == 1) { U[0] = T[0]; }
+     return n;
+   }
+ 
+   /* Use the caller's work array when there is one. */
+   B = A;
+   if(B == NULL) { B = (int *)malloc((size_t)(n + 1) * sizeof(int)); }
+   bucket_A = (int *)malloc(BUCKET_A_SIZE * sizeof(int));
+   bucket_B = (int *)malloc(BUCKET_B_SIZE * sizeof(int));
+ 
+   /* Burrows-Wheeler Transform. */
+   if((B == NULL) || (bucket_A == NULL) || (bucket_B == NULL)) {
+     pidx = -2;
+   } else {
+     m = sort_typeBstar(T, B, bucket_A, bucket_B, n, openMP);
+ 
+     want_indexes = (num_indexes != NULL) && (indexes != NULL);
+     if(want_indexes) {
+       pidx = construct_BWT_indexes(T, B, bucket_A, bucket_B, n, m, num_indexes, indexes);
+     } else {
+       pidx = construct_BWT(T, B, bucket_A, bucket_B, n, m);
+     }
+ 
+     /* Copy to output string: slots before pidx shift up by one, slot pidx
+        itself is skipped, the rest keep their position. */
+     U[0] = T[n - 1];
+     i = 0;
+     while(i < pidx) {
+       U[i + 1] = (unsigned char)B[i];
+       ++i;
+     }
+     ++i;
+     while(i < n) {
+       U[i] = (unsigned char)B[i];
+       ++i;
+     }
+     pidx += 1;
+   }
+ 
+   free(bucket_B);
+   free(bucket_A);
+   if(A == NULL) { free(B); } /* only release the array allocated here */
+ 
+   return pidx;
+ }
--- a/vendor/github.com/DataDog/zstd/divsufsort.h 0 → 100644
查看文件 @4f5343b
+++ b/vendor/github.com/DataDog/zstd/divsufsort.h 0 → 100644
查看文件 @4f5343b
+ /*
+  * divsufsort.h for libdivsufsort-lite
+  * Copyright (c) 2003-2008 Yuta Mori All Rights Reserved.
+  *
+  * Permission is hereby granted, free of charge, to any person
+  * obtaining a copy of this software and associated documentation
+  * files (the "Software"), to deal in the Software without
+  * restriction, including without limitation the rights to use,
+  * copy, modify, merge, publish, distribute, sublicense, and/or sell
+  * copies of the Software, and to permit persons to whom the
+  * Software is furnished to do so, subject to the following
+  * conditions:
+  *
+  * The above copyright notice and this permission notice shall be
+  * included in all copies or substantial portions of the Software.
+  *
+  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+  * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+  * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+  * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+  * OTHER DEALINGS IN THE SOFTWARE.
+  */
+ 
+ #ifndef _DIVSUFSORT_H
+ #define _DIVSUFSORT_H 1
+ 
+ #ifdef __cplusplus
+ extern "C" {
+ #endif /* __cplusplus */
+ 
+ 
+ /*- Prototypes -*/
+ 
+ /**
+  * Constructs the suffix array of a given string.
+  * @param T [0..n-1] The input string.
+  * @param SA [0..n-1] The output array of suffixes.
+  * @param n The length of the given string.
+  * @param openMP enables OpenMP optimization (only consulted when the
+  *        library is built with LIBBSC_OPENMP defined).
+  * @return 0 if no error occurred, -1 if T or SA is NULL or n is negative,
+  *         -2 if the internal bucket arrays cannot be allocated.
+  */
+ int
+ divsufsort(const unsigned char *T, int *SA, int n, int openMP);
+ 
+ /**
+  * Constructs the Burrows-Wheeler transformed string of a given string.
+  * @param T [0..n-1] The input string; it is only read (declared const).
+  * @param U [0..n-1] The output string. (can be T)
+  * @param A [0..n-1] The temporary array. (can be NULL)
+  * @param n The length of the given string, in bytes.
+  * @param num_indexes Pointer to the length of the secondary indexes array. (can be NULL)
+  * @param indexes The secondary indexes array. (can be NULL)
+  * @param openMP Enables OpenMP optimization.
+  * @return The primary index if no error occurred, -1 or -2 otherwise.
+  */
+ int
+ divbwt(const unsigned char *T, unsigned char *U, int *A, int n, unsigned char * num_indexes, int * indexes, int openMP);
+ 
+ 
+ #ifdef __cplusplus
+ } /* extern "C" */
+ #endif /* __cplusplus */
+ 
+ #endif /* _DIVSUFSORT_H */
--- a/vendor/github.com/DataDog/zstd/entropy_common.c 0 → 100644
查看文件 @4f5343b
+++ b/vendor/github.com/DataDog/zstd/entropy_common.c 0 → 100644
查看文件 @4f5343b
+ /*
+    Common functions of New Generation Entropy library
+    Copyright (C) 2016, Yann Collet.
+ 
+    BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php)
+ 
+    Redistribution and use in source and binary forms, with or without
+    modification, are permitted provided that the following conditions are
+    met:
+ 
+        * Redistributions of source code must retain the above copyright
+    notice, this list of conditions and the following disclaimer.
+        * Redistributions in binary form must reproduce the above
+    copyright notice, this list of conditions and the following disclaimer
+    in the documentation and/or other materials provided with the
+    distribution.
+ 
+    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+    "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+    OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+    SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+    LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+    DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+    THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+    (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+    OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ 
+     You can contact the author at :
+     - FSE+HUF source repository : https://github.com/Cyan4973/FiniteStateEntropy
+     - Public forum : https://groups.google.com/forum/#!forum/lz4c
+ *************************************************************************** */
+ 
+ /* *************************************
+ *  Dependencies
+ ***************************************/
+ #include "mem.h"
+ #include "error_private.h"       /* ERR_*, ERROR */
+ #define FSE_STATIC_LINKING_ONLY  /* FSE_MIN_TABLELOG */
+ #include "fse.h"
+ #define HUF_STATIC_LINKING_ONLY  /* HUF_TABLELOG_ABSOLUTEMAX */
+ #include "huf.h"
+ 
+ 
+ /*===   Version   ===*/
+ unsigned FSE_versionNumber(void) { return FSE_VERSION_NUMBER; }   /* returns the value of the FSE_VERSION_NUMBER macro */
+ 
+ 
+ /*===   Error Management   ===*/
+ unsigned FSE_isError(size_t code) { return ERR_isError(code); }   /* FSE-named entry point : forwards `code` to ERR_isError() and returns its result */
+ const char* FSE_getErrorName(size_t code) { return ERR_getErrorName(code); }   /* FSE-named entry point : forwards `code` to ERR_getErrorName() and returns its string */
+ 
+ unsigned HUF_isError(size_t code) { return ERR_isError(code); }   /* HUF-named entry point : same forwarding to ERR_isError() as FSE_isError() */
+ const char* HUF_getErrorName(size_t code) { return ERR_getErrorName(code); }   /* HUF-named entry point : same forwarding to ERR_getErrorName() as FSE_getErrorName() */
+ 
+ 
+ /*-**************************************************************
+ *  FSE NCount encoding-decoding
+ *
+ *  FSE_readNCount() :
+ *  Decodes a serialized table of normalized symbol counts from
+ *  `headerBuffer` (`hbSize` bytes).
+ *  - normalizedCounter : output; entries [0..*maxSVPtr] are zeroed first,
+ *                        then one count is stored per decoded symbol.
+ *                        The stored value is the decoded field minus 1,
+ *                        so -1 can appear in the table.
+ *  - maxSVPtr    : in  : highest symbol value the caller accepts;
+ *                  out : index of the last symbol actually decoded.
+ *  - tableLogPtr : out : low 4 bits of the header + FSE_MIN_TABLELOG.
+ *  @return : number of bytes consumed from `headerBuffer`, or an error code
+ *            (tableLog_tooLarge, maxSymbolValue_tooSmall, corruption_detected)
+ *            that can be tested with FSE_isError().
+ *  Inputs shorter than 4 bytes are copied into a zero-padded 4-byte buffer
+ *  and decoded from there; a result larger than `hbSize` is then reported
+ *  as corruption_detected.
+ ****************************************************************/
+ size_t FSE_readNCount (short* normalizedCounter, unsigned* maxSVPtr, unsigned* tableLogPtr,
+                  const void* headerBuffer, size_t hbSize)
+ {
+     const BYTE* const istart = (const BYTE*) headerBuffer;
+     const BYTE* const iend = istart + hbSize;
+     const BYTE* ip = istart;
+     int nbBits;   /* width, in bits, of the long form of the next count field */
+     int remaining;   /* budget still to distribute, +1 : must end at exactly 1 */
+     int threshold;
+     U32 bitStream;   /* bits not consumed yet, next bit to read in the LSB */
+     int bitCount;   /* bits already consumed, counted from the byte at ip */
+     unsigned charnum = 0;   /* index of the next symbol to fill */
+     int previous0 = 0;   /* non-zero when the last stored count was 0 */
+ 
+     if (hbSize < 4) {
+         /* This function only works when hbSize >= 4 */
+         char buffer[4];
+         memset(buffer, 0, sizeof(buffer));
+         memcpy(buffer, headerBuffer, hbSize);
+         {   size_t const countSize = FSE_readNCount(normalizedCounter, maxSVPtr, tableLogPtr,
+                                                     buffer, sizeof(buffer));
+             if (FSE_isError(countSize)) return countSize;
+             if (countSize > hbSize) return ERROR(corruption_detected);   /* decoding used padding bytes that are not part of the real input */
+             return countSize;
+     }   }
+     assert(hbSize >= 4);
+ 
+     /* init */
+     memset(normalizedCounter, 0, (*maxSVPtr+1) * sizeof(normalizedCounter[0]));   /* all symbols not present in NCount have a frequency of 0 */
+     bitStream = MEM_readLE32(ip);
+     nbBits = (bitStream & 0xF) + FSE_MIN_TABLELOG;   /* extract tableLog */
+     if (nbBits > FSE_TABLELOG_ABSOLUTE_MAX) return ERROR(tableLog_tooLarge);
+     bitStream >>= 4;
+     bitCount = 4;
+     *tableLogPtr = nbBits;
+     remaining = (1<<nbBits)+1;
+     threshold = 1<<nbBits;
+     nbBits++;   /* count fields below are read on nbBits bits, or nbBits-1 for the short form */
+ 
+     while ((remaining>1) & (charnum<=*maxSVPtr)) {
+         if (previous0) {   /* a zero count is followed by a run length of additional zero-count symbols */
+             unsigned n0 = charnum;   /* symbol index at which the zero run ends */
+             while ((bitStream & 0xFFFF) == 0xFFFF) {   /* 16 set bits : 24 more zero symbols, and the run continues */
+                 n0 += 24;
+                 if (ip < iend-5) {   /* enough input left to reload 32 bits from two bytes further on */
+                     ip += 2;
+                     bitStream = MEM_readLE32(ip) >> bitCount;
+                 } else {   /* near the end : consume the 16 bits from the current window without reloading */
+                     bitStream >>= 16;
+                     bitCount   += 16;
+             }   }
+             while ((bitStream & 3) == 3) {   /* 2-bit value 3 : 3 more zero symbols, and the run continues */
+                 n0 += 3;
+                 bitStream >>= 2;
+                 bitCount += 2;
+             }
+             n0 += bitStream & 3;   /* final 2-bit value (0..2) closes the run */
+             bitCount += 2;
+             if (n0 > *maxSVPtr) return ERROR(maxSymbolValue_tooSmall);
+             while (charnum < n0) normalizedCounter[charnum++] = 0;
+             if ((ip <= iend-7) || (ip + (bitCount>>3) <= iend-4)) {   /* a 4-byte reload after skipping the consumed bytes stays inside the input */
+                 assert((bitCount >> 3) <= 3); /* For first condition to work */
+                 ip += bitCount>>3;
+                 bitCount &= 7;
+                 bitStream = MEM_readLE32(ip) >> bitCount;
+             } else {
+                 bitStream >>= 2;   /* cannot reload : only drop the 2 bits already added to bitCount above */
+         }   }
+         {   int const max = (2*threshold-1) - remaining;
+             int count;
+ 
+             if ((bitStream & (threshold-1)) < (U32)max) {   /* short form : the value fits on nbBits-1 bits */
+                 count = bitStream & (threshold-1);
+                 bitCount += nbBits-1;
+             } else {   /* long form : read nbBits bits, values at or above threshold are shifted down by max */
+                 count = bitStream & (2*threshold-1);
+                 if (count >= threshold) count -= max;
+                 bitCount += nbBits;
+             }
+ 
+             count--;   /* extra accuracy */
+             remaining -= count < 0 ? -count : count;   /* -1 means +1 */
+             normalizedCounter[charnum++] = (short)count;
+             previous0 = !count;
+             while (remaining < threshold) {   /* smaller budget left : following fields need fewer bits */
+                 nbBits--;
+                 threshold >>= 1;
+             }
+ 
+             if ((ip <= iend-7) || (ip + (bitCount>>3) <= iend-4)) {
+                 ip += bitCount>>3;
+                 bitCount &= 7;
+             } else {   /* close to the end : pin ip on the last 4 bytes and keep the excess in bitCount */
+                 bitCount -= (int)(8 * (iend - 4 - ip));   /* re-express bitCount relative to the new ip */
+                 ip = iend - 4;
+             }
+             bitStream = MEM_readLE32(ip) >> (bitCount & 31);   /* the mask keeps the shift amount below 32 */
+     }   }   /* while ((remaining>1) & (charnum<=*maxSVPtr)) */
+     if (remaining != 1) return ERROR(corruption_detected);   /* the counts must use up the budget exactly */
+     if (bitCount > 32) return ERROR(corruption_detected);   /* more bits consumed than the last 32-bit window holds */
+     *maxSVPtr = charnum-1;
+ 
+     ip += (bitCount+7)>>3;   /* round the consumed bits up to whole bytes */
+     return ip-istart;
+ }
+ 
+ 
+ /*! HUF_readStats() :
+     Read compact Huffman tree, saved by HUF_writeCTable().
+     `huffWeight` is destination buffer, one byte per weight; `hwSize` bounds
+     how many weights may be stored in it, the implied last weight included.
+     `rankStats` receives the number of symbols per weight value. Its first
+     HUF_TABLELOG_MAX+1 U32 entries are cleared here, so the table must be
+     at least that large.
+     `nbSymbolsPtr` receives the number of weights stored in `huffWeight`.
+     `tableLogPtr` receives the table log derived from the sum of the weights.
+     The first byte of `src` selects the format : a value >= 128 means
+     (value - 127) weights follow directly, two 4-bit weights per byte;
+     a smaller value is the byte size of an FSE-compressed weight stream.
+     @return : size read from `src` , or an error Code .
+     Note : Needed by HUF_readCTable() and HUF_readDTableX?() .
+ */
+ size_t HUF_readStats(BYTE* huffWeight, size_t hwSize, U32* rankStats,
+                      U32* nbSymbolsPtr, U32* tableLogPtr,
+                      const void* src, size_t srcSize)
+ {
+     U32 weightTotal;
+     const BYTE* ip = (const BYTE*) src;
+     size_t iSize;   /* number of input bytes following the first header byte */
+     size_t oSize;   /* number of weights read from the input (implied last one excluded) */
+ 
+     if (!srcSize) return ERROR(srcSize_wrong);
+     iSize = ip[0];
+     /* memset(huffWeight, 0, hwSize);   *//* is not necessary, even though some analyzer complain ... */
+ 
+     if (iSize >= 128) {  /* special header */
+         oSize = iSize - 127;
+         iSize = ((oSize+1)/2);   /* two 4-bit weights per byte, rounded up */
+         if (iSize+1 > srcSize) return ERROR(srcSize_wrong);
+         if (oSize >= hwSize) return ERROR(corruption_detected);   /* index oSize is written below, so it must stay below hwSize */
+         ip += 1;
+         {   U32 n;
+             for (n=0; n<oSize; n+=2) {
+                 huffWeight[n]   = ip[n/2] >> 4;   /* high nibble */
+                 huffWeight[n+1] = ip[n/2] & 15;   /* low nibble; for an odd oSize this fills index oSize, rewritten with the implied last weight below */
+     }   }   }
+     else  {   /* header compressed with FSE (normal case) */
+         FSE_DTable fseWorkspace[FSE_DTABLE_SIZE_U32(6)];  /* 6 is max possible tableLog for HUF header (maybe even 5, to be tested) */
+         if (iSize+1 > srcSize) return ERROR(srcSize_wrong);
+         oSize = FSE_decompress_wksp(huffWeight, hwSize-1, ip+1, iSize, fseWorkspace, 6);   /* max (hwSize-1) values decoded, as last one is implied */
+         if (FSE_isError(oSize)) return oSize;
+     }
+ 
+     /* collect weight stats */
+     memset(rankStats, 0, (HUF_TABLELOG_MAX + 1) * sizeof(U32));
+     weightTotal = 0;
+     {   U32 n; for (n=0; n<oSize; n++) {
+             if (huffWeight[n] >= HUF_TABLELOG_MAX) return ERROR(corruption_detected);
+             rankStats[huffWeight[n]]++;
+             weightTotal += (1 << huffWeight[n]) >> 1;   /* weight w adds 2^(w-1); weight 0 adds nothing */
+     }   }
+     if (weightTotal == 0) return ERROR(corruption_detected);
+ 
+     /* get last non-null symbol weight (implied, total must be 2^n) */
+     {   U32 const tableLog = BIT_highbit32(weightTotal) + 1;
+         if (tableLog > HUF_TABLELOG_MAX) return ERROR(corruption_detected);
+         *tableLogPtr = tableLog;
+         /* determine last weight */
+         {   U32 const total = 1 << tableLog;
+             U32 const rest = total - weightTotal;   /* what the implied last weight must contribute to reach the power of 2 */
+             U32 const verif = 1 << BIT_highbit32(rest);
+             U32 const lastWeight = BIT_highbit32(rest) + 1;
+             if (verif != rest) return ERROR(corruption_detected);    /* last value must be a clean power of 2 */
+             huffWeight[oSize] = (BYTE)lastWeight;
+             rankStats[lastWeight]++;
+     }   }
+ 
+     /* check tree construction validity */
+     if ((rankStats[1] < 2) || (rankStats[1] & 1)) return ERROR(corruption_detected);   /* by construction : at least 2 elts of rank 1, must be even */
+ 
+     /* results */
+     *nbSymbolsPtr = (U32)(oSize+1);   /* weights read from the input plus the implied last one */
+     return iSize+1;   /* payload bytes plus the leading header byte */
+ }