Add csv parser unix timestamp support (#5047)

This commit is contained in:
Felipe Dutra Tine e Silva 2018-11-28 19:07:25 -05:00 committed by Daniel Nelson
parent 168c2b0ed1
commit f9113b63b7
3 changed files with 58 additions and 16 deletions

View File

@ -75,7 +75,8 @@ document.
The `csv_timestamp_column` option specifies the column name containing the The `csv_timestamp_column` option specifies the column name containing the
time value and `csv_timestamp_format` must be set to a Go "reference time" time value and `csv_timestamp_format` must be set to a Go "reference time"
which is defined to be the specific time: `Mon Jan 2 15:04:05 MST 2006`. which is defined to be the specific time: `Mon Jan 2 15:04:05 MST 2006`,
it can also be `unix` (for an epoch timestamp in seconds, like 1257894000).
Consult the Go [time][time parse] package for details and additional examples Consult the Go [time][time parse] package for details and additional examples
on how to set the time format. on how to set the time format.

View File

@ -207,21 +207,9 @@ outer:
measurementName = fmt.Sprintf("%v", recordFields[p.MeasurementColumn]) measurementName = fmt.Sprintf("%v", recordFields[p.MeasurementColumn])
} }
metricTime := p.TimeFunc() metricTime, err := parseTimestamp(p.TimeFunc, recordFields, p.TimestampColumn, p.TimestampFormat)
if p.TimestampColumn != "" { if err != nil {
if recordFields[p.TimestampColumn] == nil { return nil, err
return nil, fmt.Errorf("timestamp column: %v could not be found", p.TimestampColumn)
}
tStr := fmt.Sprintf("%v", recordFields[p.TimestampColumn])
if p.TimestampFormat == "" {
return nil, fmt.Errorf("timestamp format must be specified")
}
var err error
metricTime, err = time.Parse(p.TimestampFormat, tStr)
if err != nil {
return nil, err
}
} }
m, err := metric.New(measurementName, tags, recordFields, metricTime) m, err := metric.New(measurementName, tags, recordFields, metricTime)
@ -231,6 +219,41 @@ outer:
return m, nil return m, nil
} }
// parseTimestamp resolves the time to attach to a metric built from one CSV
// record.
//
// When timestampColumn is empty the record carries no timestamp and the result
// of timeFunc is returned. Otherwise the value stored under timestampColumn in
// recordFields is rendered with fmt's %v verb and interpreted according to
// timestampFormat:
//
//   - "unix": the value must be a base-10 integer holding whole seconds since
//     the Unix epoch (for example 1257894000);
//   - any other non-empty string: the value is handed to time.Parse with
//     timestampFormat as the Go reference-time layout.
//
// An error is returned when the column is absent (or nil) in recordFields, when
// timestampFormat is empty, or when the value cannot be parsed. On error the
// returned time is the zero time.Time.
func parseTimestamp(timeFunc func() time.Time, recordFields map[string]interface{}, timestampColumn, timestampFormat string) (metricTime time.Time, err error) {
	// No timestamp column configured: fall back to the supplied clock.
	if timestampColumn == "" {
		return timeFunc(), nil
	}

	value := recordFields[timestampColumn]
	if value == nil {
		return time.Time{}, fmt.Errorf("timestamp column: %v could not be found", timestampColumn)
	}
	tStr := fmt.Sprintf("%v", value)

	switch timestampFormat {
	case "":
		return time.Time{}, fmt.Errorf("timestamp format must be specified")
	case "unix":
		seconds, parseErr := strconv.ParseInt(tStr, 10, 64)
		if parseErr != nil {
			return time.Time{}, parseErr
		}
		// The nanosecond argument is 0: the column holds whole seconds.
		return time.Unix(seconds, 0), nil
	default:
		parsed, parseErr := time.Parse(timestampFormat, tStr)
		if parseErr != nil {
			return time.Time{}, parseErr
		}
		return parsed, nil
	}
}
// SetDefaultTags sets the DefaultTags.
func (p *Parser) SetDefaultTags(tags map[string]string) { func (p *Parser) SetDefaultTags(tags map[string]string) {
p.DefaultTags = tags p.DefaultTags = tags
} }

View File

@ -88,6 +88,24 @@ func TestTimestampError(t *testing.T) {
require.Equal(t, fmt.Errorf("timestamp format must be specified"), err) require.Equal(t, fmt.Errorf("timestamp format must be specified"), err)
} }
// TestTimestampUnixFormat verifies that with TimestampFormat set to "unix" the
// values in the timestamp column are read as whole seconds since the Unix
// epoch and become the time of the resulting metrics.
func TestTimestampUnixFormat(t *testing.T) {
	p := Parser{
		HeaderRowCount:    1,
		ColumnNames:       []string{"first", "second", "third"},
		MeasurementColumn: "third",
		TimestampColumn:   "first",
		TimestampFormat:   "unix",
		TimeFunc:          DefaultTime,
	}
	testCSV := `line1,line2,line3
1243094706,70,test_name
1257609906,80,test_name2`
	metrics, err := p.Parse([]byte(testCSV))
	require.NoError(t, err)
	// Guard the indexing below so a short result fails the test instead of
	// panicking.
	require.Len(t, metrics, 2)
	// testify takes (expected, actual); keeping that order makes failure
	// output label the two values correctly.
	require.Equal(t, int64(1243094706000000000), metrics[0].Time().UnixNano())
	require.Equal(t, int64(1257609906000000000), metrics[1].Time().UnixNano())
}
func TestQuotedCharacter(t *testing.T) { func TestQuotedCharacter(t *testing.T) {
p := Parser{ p := Parser{
HeaderRowCount: 1, HeaderRowCount: 1,