mirror of
https://github.com/dolthub/dolt.git
synced 2026-05-04 19:41:26 -05:00
150 lines
3.9 KiB
Go
150 lines
3.9 KiB
Go
// Copyright 2019 Dolthub, Inc.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package main
|
|
|
|
import (
|
|
"io"
|
|
"log"
|
|
"strings"
|
|
)
|
|
|
|
// Dataset describes a body of test data used when benchmarking. An
// implementation knows how to generate its data and how to hand back a
// variant of itself that differs by some percentage.
type Dataset interface {
	// GenerateData produces the test data for this Dataset.
	GenerateData()

	// Change returns a Dataset derived from this one, mutated by pct
	// percent.
	Change(pct float32) Dataset
}
|
|
|
|
// DSImpl implements the Dataset interface
|
|
type DSImpl struct {
|
|
// Schema defines the structure of the Dataset
|
|
Schema *SeedSchema
|
|
|
|
// TableName is the name of the test dataset
|
|
TableName string
|
|
|
|
// w is the writer where the test dataset will be written
|
|
w io.Writer
|
|
|
|
// sf is the function used to generate random data values in the dataset
|
|
sf seedFunc
|
|
}
|
|
|
|
// NewDSImpl creates a new DSImpl
|
|
func NewDSImpl(wc io.Writer, sch *SeedSchema, sf seedFunc, tableName string) *DSImpl {
|
|
return &DSImpl{Schema: sch, TableName: tableName, sf: sf, w: wc}
|
|
}
|
|
|
|
// GenerateData generates a dataset and writes it to a io.Writer
|
|
func (ds *DSImpl) GenerateData() {
|
|
writeDataToWriter(ds.w, ds.Schema.Rows, ds.Schema.Columns, ds.sf, ds.TableName, ds.Schema.FileFormatExt)
|
|
}
|
|
|
|
// Change returns a DataSet that is a mutation of this Dataset by the given percentage
|
|
func (ds *DSImpl) Change(pct float32) Dataset {
|
|
// TODO
|
|
return &DSImpl{}
|
|
}
|
|
|
|
func writeDataToWriter(wc io.Writer, rows int, cols []*SeedColumn, sf seedFunc, tableName, format string) {
|
|
// handle the "header" for all format types
|
|
writeHeader(wc, cols, tableName, format)
|
|
|
|
var prevRow []string
|
|
for i := 0; i < rows; i++ {
|
|
row := make([]string, len(cols))
|
|
|
|
for colIndex, col := range cols {
|
|
val := getColValue(prevRow, colIndex, col, sf, format)
|
|
row[colIndex] = val
|
|
|
|
if i > 0 && prevRow != nil {
|
|
prevRow[colIndex] = val
|
|
}
|
|
}
|
|
_, err := wc.Write([]byte(formatRow(row, cols, i, rows-1, tableName, format)))
|
|
if err != nil {
|
|
log.Fatal(err)
|
|
}
|
|
prevRow = row[:]
|
|
}
|
|
|
|
// handle the "footer" for format types
|
|
switch format {
|
|
case jsonExt:
|
|
suffix := "]}\n"
|
|
_, err := wc.Write([]byte(suffix))
|
|
if err != nil {
|
|
log.Fatal(err)
|
|
}
|
|
default:
|
|
}
|
|
}
|
|
|
|
func writeHeader(w io.Writer, cols []*SeedColumn, tableName, format string) {
|
|
switch format {
|
|
case csvExt:
|
|
header := makeCSVHeaderStr(cols, tableName, format)
|
|
_, err := w.Write([]byte(header + "\n"))
|
|
if err != nil {
|
|
log.Fatal(err)
|
|
}
|
|
case sqlExt:
|
|
header := getSQLHeader(cols, tableName, format)
|
|
_, err := w.Write([]byte(header + "\n"))
|
|
if err != nil {
|
|
log.Fatal(err)
|
|
}
|
|
case jsonExt:
|
|
prefix := "{\"Rows\":["
|
|
_, err := w.Write([]byte(prefix))
|
|
if err != nil {
|
|
log.Fatal(err)
|
|
}
|
|
default:
|
|
log.Fatalf("unable to write the header, unsupported format %v \n", format)
|
|
}
|
|
}
|
|
|
|
func formatRow(strs []string, cols []*SeedColumn, currentRowIdx, lastRowIdx int, tableName, format string) string {
|
|
switch format {
|
|
case csvExt:
|
|
return strings.Join(strs, ",") + "\n"
|
|
case sqlExt:
|
|
return getSQLRow(strs, cols, tableName) + "\n"
|
|
case jsonExt:
|
|
var suffix string
|
|
if currentRowIdx == lastRowIdx {
|
|
suffix = "\n"
|
|
} else {
|
|
suffix = ",\n"
|
|
}
|
|
return getJSONRow(strs, cols) + suffix
|
|
default:
|
|
log.Fatalf("cannot format row, unsupported file format %s \n", format)
|
|
}
|
|
return ""
|
|
}
|
|
|
|
func makeCSVHeaderStr(cols []*SeedColumn, tableName, format string) string {
|
|
str := make([]string, 0, len(cols))
|
|
for _, col := range cols {
|
|
str = append(str, col.Name)
|
|
}
|
|
return formatRow(str, cols, 0, 1, tableName, format)
|
|
}
|