From 2a1e6533b78c474a792888b64fecbfce85f5403d Mon Sep 17 00:00:00 2001
From: "Jonathan A. Sternberg" <jonathan@influxdb.com>
Date: Tue, 21 Jun 2016 10:31:05 -0500
Subject: [PATCH] Rename dumptsmdev to dumptsm in influx_inspect

Removes the old implementation of `dumptsm`. It was for an older version
of the tsm1 files that is no longer used and now just panics when used
on a tsm1 file. dumptsmdev has been renamed to `dumptsm`, but the old
`dumptsmdev` command still works for compatibility.
---
 CHANGELOG.md               |   1 +
 cmd/influx_inspect/main.go |  40 +---
 cmd/influx_inspect/tsm.go  | 383 -------------------------------------
 3 files changed, 6 insertions(+), 418 deletions(-)
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 7314b510da5..e78987076d5 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -70,6 +70,7 @@ With this release the systemd configuration files for InfluxDB will use the syst
 - [#6859](https://github.com/influxdata/influxdb/issues/6859): Set the condition cursor instead of aux iterator when creating a nil condition cursor.
 - [#6869](https://github.com/influxdata/influxdb/issues/6869): Remove FieldCodec from tsdb package.
 - [#6882](https://github.com/influxdata/influxdb/pull/6882): Remove a double lock in the tsm1 index writer.
+- [#6883](https://github.com/influxdata/influxdb/pull/6883): Rename dumptsmdev to dumptsm in influx_inspect.
 
 ## v0.13.0 [2016-05-12]
 
diff --git a/cmd/influx_inspect/main.go b/cmd/influx_inspect/main.go
index fceb4b79463..88e7003bea7 100644
--- a/cmd/influx_inspect/main.go
+++ b/cmd/influx_inspect/main.go
@@ -16,8 +16,7 @@ Displays detailed information about InfluxDB data files.
 
 	println(`Commands:
   info - displays series meta-data for all shards.  Default location [$HOME/.influxdb]
-  dumptsm - dumps low-level details about tsm1 files.
-  dumptsmdev - dumps low-level details about tsm1dev files.`)
+  dumptsm - dumps low-level details about tsm1 files.`)
 	println()
 }
 
@@ -38,7 +37,7 @@ func main() {
 		fs.StringVar(&path, "dir", os.Getenv("HOME")+"/.influxdb", "Root storage path. [$HOME/.influxdb]")
 
 		fs.Usage = func() {
-			println("Usage: influx_inspect info [options]\n\n   Displays series meta-data for all shards..")
+			println("Usage: influx_inspect info [options]\n\n   Displays series meta-data for all shards.")
 			println()
 			println("Options:")
 			fs.PrintDefaults()
@@ -49,6 +48,9 @@ func main() {
 			os.Exit(1)
 		}
 		cmdInfo(path)
+	case "dumptsmdev":
+		fmt.Fprintf(os.Stderr, "warning: dumptsmdev is deprecated, use dumptsm instead.\n")
+		fallthrough
 	case "dumptsm":
 		var dumpAll bool
 		opts := &tsdmDumpOpts{}
@@ -81,38 +83,6 @@ func main() {
 		opts.dumpBlocks = opts.dumpBlocks || dumpAll || opts.filterKey != ""
 		opts.dumpIndex = opts.dumpIndex || dumpAll || opts.filterKey != ""
 		cmdDumpTsm1(opts)
-	case "dumptsmdev":
-		var dumpAll bool
-		opts := &tsdmDumpOpts{}
-		fs := flag.NewFlagSet("file", flag.ExitOnError)
-		fs.BoolVar(&opts.dumpIndex, "index", false, "Dump raw index data")
-		fs.BoolVar(&opts.dumpBlocks, "blocks", false, "Dump raw block data")
-		fs.BoolVar(&dumpAll, "all", false, "Dump all data. Caution: This may print a lot of information")
-		fs.StringVar(&opts.filterKey, "filter-key", "", "Only display index and block data match this key substring")
-
-		fs.Usage = func() {
-			println("Usage: influx_inspect dumptsm [options] <path>\n\n  Dumps low-level details about tsm1 files.")
-			println()
-			println("Options:")
-			fs.PrintDefaults()
-			os.Exit(0)
-		}
-
-		if err := fs.Parse(flag.Args()[1:]); err != nil {
-			fmt.Printf("%v", err)
-			os.Exit(1)
-		}
-
-		if len(fs.Args()) == 0 || fs.Args()[0] == "" {
-			fmt.Printf("TSM file not specified\n\n")
-			fs.Usage()
-			fs.PrintDefaults()
-			os.Exit(1)
-		}
-		opts.path = fs.Args()[0]
-		opts.dumpBlocks = opts.dumpBlocks || dumpAll || opts.filterKey != ""
-		opts.dumpIndex = opts.dumpIndex || dumpAll || opts.filterKey != ""
-		cmdDumpTsm1dev(opts)
 	case "verify":
 		var path string
 		fs := flag.NewFlagSet("verify", flag.ExitOnError)
diff --git a/cmd/influx_inspect/tsm.go b/cmd/influx_inspect/tsm.go
index 84fbe8c25a5..acc7deee6c0 100644
--- a/cmd/influx_inspect/tsm.go
+++ b/cmd/influx_inspect/tsm.go
@@ -2,37 +2,16 @@ package main
 
 import (
 	"encoding/binary"
-	"encoding/json"
 	"fmt"
-	"io/ioutil"
 	"os"
-	"path/filepath"
 	"strconv"
 	"strings"
 	"text/tabwriter"
 	"time"
 
-	"github.com/golang/snappy"
-	"github.com/influxdata/influxdb/tsdb"
 	"github.com/influxdata/influxdb/tsdb/engine/tsm1"
 )
 
-// these consts are for the old tsm format. They can be removed once we remove
-// the inspection for the original tsm1 files.
-const (
-	//IDsFileExtension is the extension for the file that keeps the compressed map
-	// of keys to uint64 IDs.
-	IDsFileExtension = "ids"
-
-	// FieldsFileExtension is the extension for the file that stores compressed field
-	// encoding data for this db
-	FieldsFileExtension = "fields"
-
-	// SeriesFileExtension is the extension for the file that stores the compressed
-	// series metadata for series in this db
-	SeriesFileExtension = "series"
-)
-
 type tsdmDumpOpts struct {
 	dumpIndex  bool
 	dumpBlocks bool
@@ -40,19 +19,6 @@ type tsdmDumpOpts struct {
 	path       string
 }
 
-type tsmIndex struct {
-	series  int
-	offset  int64
-	minTime int64
-	maxTime int64
-	blocks  []*block
-}
-
-type block struct {
-	id     uint64
-	offset int64
-}
-
 type blockStats struct {
 	min, max int
 	counts   [][]int
@@ -104,140 +70,6 @@ var (
 	}
 )
 
-func readFields(path string) (map[string]*tsdb.MeasurementFields, error) {
-	fields := make(map[string]*tsdb.MeasurementFields)
-
-	f, err := os.OpenFile(filepath.Join(path, FieldsFileExtension), os.O_RDONLY, 0666)
-	if os.IsNotExist(err) {
-		return fields, nil
-	} else if err != nil {
-		return nil, err
-	}
-	b, err := ioutil.ReadAll(f)
-	if err != nil {
-		return nil, err
-	}
-
-	data, err := snappy.Decode(nil, b)
-	if err != nil {
-		return nil, err
-	}
-
-	if err := json.Unmarshal(data, &fields); err != nil {
-		return nil, err
-	}
-	return fields, nil
-}
-
-func readSeries(path string) (map[string]*tsdb.Series, error) {
-	series := make(map[string]*tsdb.Series)
-
-	f, err := os.OpenFile(filepath.Join(path, SeriesFileExtension), os.O_RDONLY, 0666)
-	if os.IsNotExist(err) {
-		return series, nil
-	} else if err != nil {
-		return nil, err
-	}
-	defer f.Close()
-	b, err := ioutil.ReadAll(f)
-	if err != nil {
-		return nil, err
-	}
-
-	data, err := snappy.Decode(nil, b)
-	if err != nil {
-		return nil, err
-	}
-
-	if err := json.Unmarshal(data, &series); err != nil {
-		return nil, err
-	}
-
-	return series, nil
-}
-
-func readIds(path string) (map[string]uint64, error) {
-	f, err := os.OpenFile(filepath.Join(path, IDsFileExtension), os.O_RDONLY, 0666)
-	if os.IsNotExist(err) {
-		return nil, nil
-	} else if err != nil {
-		return nil, err
-	}
-	b, err := ioutil.ReadAll(f)
-	if err != nil {
-		return nil, err
-	}
-
-	b, err = snappy.Decode(nil, b)
-	if err != nil {
-		return nil, err
-	}
-
-	ids := make(map[string]uint64)
-	if b != nil {
-		if err := json.Unmarshal(b, &ids); err != nil {
-			return nil, err
-		}
-	}
-	return ids, err
-}
-
-func readIndex(f *os.File) (*tsmIndex, error) {
-	// Get the file size
-	stat, err := f.Stat()
-	if err != nil {
-		return nil, err
-	}
-
-	// Seek to the series count
-	f.Seek(-4, os.SEEK_END)
-	b := make([]byte, 8)
-	_, err = f.Read(b[:4])
-	if err != nil {
-		return nil, err
-	}
-
-	seriesCount := binary.BigEndian.Uint32(b)
-
-	// Get the min time
-	f.Seek(-20, os.SEEK_END)
-	f.Read(b)
-	minTime := int64(binary.BigEndian.Uint64(b))
-
-	// Get max time
-	f.Seek(-12, os.SEEK_END)
-	f.Read(b)
-	maxTime := int64(binary.BigEndian.Uint64(b))
-
-	// Figure out where the index starts
-	indexStart := stat.Size() - int64(seriesCount*12+20)
-
-	// Seek to the start of the index
-	f.Seek(indexStart, os.SEEK_SET)
-	count := int(seriesCount)
-	index := &tsmIndex{
-		offset:  indexStart,
-		minTime: minTime,
-		maxTime: maxTime,
-		series:  count,
-	}
-
-	if indexStart < 0 {
-		return nil, fmt.Errorf("index corrupt: offset=%d", indexStart)
-	}
-
-	// Read the index entries
-	for i := 0; i < count; i++ {
-		f.Read(b)
-		id := binary.BigEndian.Uint64(b)
-		f.Read(b[:4])
-		pos := binary.BigEndian.Uint32(b[:4])
-		index.blocks = append(index.blocks, &block{id: id, offset: int64(pos)})
-	}
-
-	return index, nil
-}
-
 func cmdDumpTsm1(opts *tsdmDumpOpts) {
 	var errors []error
 
@@ -247,221 +79,6 @@ func cmdDumpTsm1(opts *tsdmDumpOpts) {
 		os.Exit(1)
 	}
 
-	// Get the file size
-	stat, err := f.Stat()
-	if err != nil {
-		println(err.Error())
-		os.Exit(1)
-	}
-
-	b := make([]byte, 8)
-	f.Read(b[:4])
-
-	// Verify magic number
-	if binary.BigEndian.Uint32(b[:4]) != 0x16D116D1 {
-		println("Not a tsm1 file.")
-		os.Exit(1)
-	}
-
-	ids, err := readIds(filepath.Dir(opts.path))
-	if err != nil {
-		println("Failed to read series:", err.Error())
-		os.Exit(1)
-	}
-
-	invIds := map[uint64]string{}
-	for k, v := range ids {
-		invIds[v] = k
-	}
-
-	index, err := readIndex(f)
-	if err != nil {
-		println("Failed to readIndex:", err.Error())
-
-		// Create a stubbed out index so we can still try and read the block data directly
-		// w/o panicing ourselves.
-		index = &tsmIndex{
-			minTime: 0,
-			maxTime: 0,
-			offset:  stat.Size(),
-		}
-	}
-
-	blockStats := &blockStats{}
-
-	println("Summary:")
-	fmt.Printf("  File: %s\n", opts.path)
-	fmt.Printf("  Time Range: %s - %s\n",
-		time.Unix(0, index.minTime).UTC().Format(time.RFC3339Nano),
-		time.Unix(0, index.maxTime).UTC().Format(time.RFC3339Nano),
-	)
-	fmt.Printf("  Duration: %s ", time.Unix(0, index.maxTime).Sub(time.Unix(0, index.minTime)))
-	fmt.Printf("  Series: %d ", index.series)
-	fmt.Printf("  File Size: %d\n", stat.Size())
-	println()
-
-	tw := tabwriter.NewWriter(os.Stdout, 8, 8, 1, '\t', 0)
-	fmt.Fprintln(tw, "  "+strings.Join([]string{"Pos", "ID", "Ofs", "Key", "Field"}, "\t"))
-	for i, block := range index.blocks {
-		key := invIds[block.id]
-		split := strings.Split(key, "#!~#")
-
-		// We dont' know know if we have fields so use an informative default
-		var measurement, field string = "UNKNOWN", "UNKNOWN"
-
-		// We read some IDs from the ids file
-		if len(invIds) > 0 {
-			// Change the default to error until we know we have a valid key
-			measurement = "ERR"
-			field = "ERR"
-
-			// Possible corruption? Try to read as much as we can and point to the problem.
-			if key == "" {
-				errors = append(errors, fmt.Errorf("index pos %d, field id: %d, missing key for id", i, block.id))
-			} else if len(split) < 2 {
-				errors = append(errors, fmt.Errorf("index pos %d, field id: %d, key corrupt: got '%v'", i, block.id, key))
-			} else {
-				measurement = split[0]
-				field = split[1]
-			}
-		}
-
-		if opts.filterKey != "" && !strings.Contains(key, opts.filterKey) {
-			continue
-		}
-		fmt.Fprintln(tw, "  "+strings.Join([]string{
-			strconv.FormatInt(int64(i), 10),
-			strconv.FormatUint(block.id, 10),
-			strconv.FormatInt(int64(block.offset), 10),
-			measurement,
-			field,
-		}, "\t"))
-	}
-
-	if opts.dumpIndex {
-		println("Index:")
-		tw.Flush()
-		println()
-	}
-
-	tw = tabwriter.NewWriter(os.Stdout, 8, 8, 1, '\t', 0)
-	fmt.Fprintln(tw, "  "+strings.Join([]string{"Blk", "Ofs", "Len", "ID", "Type", "Min Time", "Points", "Enc [T/V]", "Len [T/V]"}, "\t"))
-
-	// Staring at 4 because the magic number is 4 bytes
-	i := int64(4)
-	var blockCount, pointCount, blockSize int64
-	indexSize := stat.Size() - index.offset
-
-	// Start at the beginning and read every block
-	for i < index.offset {
-		f.Seek(int64(i), 0)
-
-		f.Read(b)
-		id := binary.BigEndian.Uint64(b)
-		f.Read(b[:4])
-		length := binary.BigEndian.Uint32(b[:4])
-		buf := make([]byte, length)
-		f.Read(buf)
-
-		blockSize += int64(len(buf)) + 12
-
-		startTime := time.Unix(0, int64(binary.BigEndian.Uint64(buf[:8])))
-		blockType := buf[8]
-
-		encoded := buf[9:]
-
-		cnt := tsm1.BlockCount(buf)
-		pointCount += int64(cnt)
-
-		// Length of the timestamp block
-		tsLen, j := binary.Uvarint(encoded)
-
-		// Unpack the timestamp bytes
-		ts := encoded[int(j) : int(j)+int(tsLen)]
-
-		// Unpack the value bytes
-		values := encoded[int(j)+int(tsLen):]
-
-		tsEncoding := timeEnc[int(ts[0]>>4)]
-		vEncoding := encDescs[int(blockType+1)][values[0]>>4]
-
-		typeDesc := blockTypes[blockType]
-
-		blockStats.inc(0, ts[0]>>4)
-		blockStats.inc(int(blockType+1), values[0]>>4)
-		blockStats.size(len(buf))
-
-		if opts.filterKey != "" && !strings.Contains(invIds[id], opts.filterKey) {
-			i += (12 + int64(length))
-			blockCount++
-			continue
-		}
-
-		fmt.Fprintln(tw, "  "+strings.Join([]string{
-			strconv.FormatInt(blockCount, 10),
-			strconv.FormatInt(i, 10),
-			strconv.FormatInt(int64(len(buf)), 10),
-			strconv.FormatUint(id, 10),
-			typeDesc,
-			startTime.UTC().Format(time.RFC3339Nano),
-			strconv.FormatInt(int64(cnt), 10),
-			fmt.Sprintf("%s/%s", tsEncoding, vEncoding),
-			fmt.Sprintf("%d/%d", len(ts), len(values)),
-		}, "\t"))
-
-		i += (12 + int64(length))
-		blockCount++
-	}
-	if opts.dumpBlocks {
-		println("Blocks:")
-		tw.Flush()
-		println()
-	}
-
-	fmt.Printf("Statistics\n")
-	fmt.Printf("  Blocks:\n")
-	fmt.Printf("    Total: %d Size: %d Min: %d Max: %d Avg: %d\n",
-		blockCount, blockSize, blockStats.min, blockStats.max, blockSize/blockCount)
-	fmt.Printf("  Index:\n")
-	fmt.Printf("    Total: %d Size: %d\n", len(index.blocks), indexSize)
-	fmt.Printf("  Points:\n")
-	fmt.Printf("    Total: %d", pointCount)
-	println()
-
-	println("  Encoding:")
-	for i, counts := range blockStats.counts {
-		if len(counts) == 0 {
-			continue
-		}
-		fmt.Printf("    %s: ", strings.Title(fieldType[i]))
-		for j, v := range counts {
-			fmt.Printf("\t%s: %d (%d%%) ", encDescs[i][j], v, int(float64(v)/float64(blockCount)*100))
-		}
-		println()
-	}
-	fmt.Printf("  Compression:\n")
-	fmt.Printf("    Per block: %0.2f bytes/point\n", float64(blockSize)/float64(pointCount))
-	fmt.Printf("    Total: %0.2f bytes/point\n", float64(stat.Size())/float64(pointCount))
-
-	if len(errors) > 0 {
-		println()
-		fmt.Printf("Errors (%d):\n", len(errors))
-		for _, err := range errors {
-			fmt.Printf("  * %v\n", err)
-		}
-		println()
-	}
-}
-
-func cmdDumpTsm1dev(opts *tsdmDumpOpts) {
-	var errors []error
-
-	f, err := os.Open(opts.path)
-	if err != nil {
-		println(err.Error())
-		os.Exit(1)
-	}
-
 	// Get the file size
 	stat, err := f.Stat()
 	if err != nil {