Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

WebAdmin Crashed. InfluxDB does not start. #369

Closed
samuraraujo opened this issue Mar 28, 2014 · 23 comments
Closed

WebAdmin Crashed. InfluxDB does not start. #369

samuraraujo opened this issue Mar 28, 2014 · 23 comments
Milestone

Comments

@samuraraujo
Copy link

[2014/03/28 10:44:30 BRT] DEBG recovery requestsSinceLastIndex: 749, requestNumber: 186749
[2014/03/28 10:44:30 BRT] DEBG largestrequestnumber: 186749

panic: Replay error. Stacktrace:
goroutine 17 [running]:
common.NewErrorWithStacktrace(0x7f3a8ac847b0, 0xc210162f40, 0xc210162f50, 0x1, 0x1, ...)
/home/vagrant/influxdb/src/common/error_with_stacktrace.go:22 +0x7f
wal.newErrorReplayRequest(0x7f3a8ac847b0, 0xc210162f40, 0x0)
/home/vagrant/influxdb/src/wal/replay_request.go:19 +0xc0
wal.(*log).replayFromFileLocation(0xc2100ea240, 0xc2100c2008, 0xc210125090, 0xc2100e96e0, 0xc2100e8c60)
/home/vagrant/influxdb/src/wal/log.go:254 +0x7ea
wal.func·002()
/home/vagrant/influxdb/src/wal/log.go:133 +0x25b
created by wal.(*log).dupAndReplayFromOffset
/home/vagrant/influxdb/src/wal/log.go:134 +0x16c

Caused by: proto: required field "{Unknown}" not set

goroutine 1 [running]:
runtime.panic(0x857020, 0xc2101099c0)
/home/vagrant/bin/go/src/pkg/runtime/panic.c:266 +0xb6
wal.(*WAL).SetServerId(0xc210070180, 0xc200000001)
/home/vagrant/influxdb/src/wal/wal.go:112 +0x122
server.(*Server).ListenAndServe(0xc21000b150, 0xc21000b150, 0x0)
/home/vagrant/influxdb/src/server/server.go:89 +0x10d
main.main()
/home/vagrant/influxdb/src/daemon/influxd.go:116 +0x599

goroutine 3 [runnable]:
code.google.com/p/log4go.ConsoleLogWriter.run(0xc2100482c0, 0x7f3a8ac77fe8, 0xc210000008)
/home/vagrant/influxdb/src/code.google.com/p/log4go/termlog.go:31 +0x297
created by code.google.com/p/log4go.NewConsoleLogWriter
/home/vagrant/influxdb/src/code.google.com/p/log4go/termlog.go:19 +0x67

goroutine 4 [syscall]:
os/signal.loop()
/home/vagrant/bin/go/src/pkg/os/signal/signal_unix.go:21 +0x1e
created by os/signal.init·1
/home/vagrant/bin/go/src/pkg/os/signal/signal_unix.go:27 +0x31

goroutine 5 [runnable]:
code.google.com/p/log4go.func·002()
/home/vagrant/influxdb/src/code.google.com/p/log4go/filelog.go:84 +0x84c
created by code.google.com/p/log4go.NewFileLogWriter
/home/vagrant/influxdb/src/code.google.com/p/log4go/filelog.go:116 +0x2d1

goroutine 6 [syscall]:
runtime.goexit()
/home/vagrant/bin/go/src/pkg/runtime/proc.c:1394

goroutine 7 [chan receive]:
wal.(*WAL).processEntries(0xc210070180)
/home/vagrant/influxdb/src/wal/wal.go:237 +0x3f
created by wal.NewWAL
/home/vagrant/influxdb/src/wal/wal.go:102 +0x9f3

goroutine 8 [sleep]:
time.Sleep(0x8bb2c97000)
/tmp/makerelease886106415/go/src/pkg/runtime/time.goc:31 +0x31
cluster.func·001()
/home/vagrant/influxdb/src/cluster/cluster_configuration.go:129 +0x35
created by cluster.(*ClusterConfiguration).CreateFutureShardsAutomaticallyBeforeTimeComes
/home/vagrant/influxdb/src/cluster/cluster_configuration.go:134 +0x63

goroutine 9 [IO wait]:
net.runtime_pollWait(0x7f3a8ac79f88, 0x72, 0x0)
/tmp/makerelease886106415/go/src/pkg/runtime/netpoll.goc:116 +0x6a
net.(*pollDesc).Wait(0xc2100f51b0, 0x72, 0x7f3a8ac78120, 0xb)
/home/vagrant/bin/go/src/pkg/net/fd_poll_runtime.go:81 +0x34
net.(*pollDesc).WaitRead(0xc2100f51b0, 0xb, 0x7f3a8ac78120)
/home/vagrant/bin/go/src/pkg/net/fd_poll_runtime.go:86 +0x30
net.(*netFD).accept(0xc2100f5150, 0x9f4698, 0x0, 0x7f3a8ac78120, 0xb)
/home/vagrant/bin/go/src/pkg/net/fd_unix.go:382 +0x2c2
net.(*TCPListener).AcceptTCP(0xc210000918, 0xc210036770, 0x0, 0x7f3a8ac79060)
/home/vagrant/bin/go/src/pkg/net/tcpsock_posix.go:233 +0x47
net.(*TCPListener).Accept(0xc210000918, 0xc210036770, 0x7f3a8aafaf38, 0x1, 0x1)
/home/vagrant/bin/go/src/pkg/net/tcpsock_posix.go:243 +0x27
coordinator.(*ProtobufServer).ListenAndServe(0xc21006eb40)
/home/vagrant/influxdb/src/coordinator/protobuf_server.go:62 +0x1c7
created by server.(*Server).ListenAndServe
/home/vagrant/influxdb/src/server/server.go:80 +0x3d

goroutine 10 [IO wait]:
net.runtime_pollWait(0x7f3a8ac7a030, 0x72, 0x0)
/tmp/makerelease886106415/go/src/pkg/runtime/netpoll.goc:116 +0x6a
net.(*pollDesc).Wait(0xc21000b220, 0x72, 0x7f3a8ac78120, 0xb)
/home/vagrant/bin/go/src/pkg/net/fd_poll_runtime.go:81 +0x34
net.(*pollDesc).WaitRead(0xc21000b220, 0xb, 0x7f3a8ac78120)
/home/vagrant/bin/go/src/pkg/net/fd_poll_runtime.go:86 +0x30
net.(*netFD).accept(0xc21000b1c0, 0x9f4698, 0x0, 0x7f3a8ac78120, 0xb)
/home/vagrant/bin/go/src/pkg/net/fd_unix.go:382 +0x2c2
net.(*TCPListener).AcceptTCP(0xc210000848, 0x18, 0xc2100f8810, 0x5d8d03)
/home/vagrant/bin/go/src/pkg/net/tcpsock_posix.go:233 +0x47
net.(*TCPListener).Accept(0xc210000848, 0x0, 0x0, 0x0, 0x0)
/home/vagrant/bin/go/src/pkg/net/tcpsock_posix.go:243 +0x27
net/http.(*Server).Serve(0xc2100981e0, 0x7f3a8ac79090, 0xc210000848, 0x0, 0x0)
/home/vagrant/bin/go/src/pkg/net/http/server.go:1622 +0x91
coordinator.func·008()
/home/vagrant/influxdb/src/coordinator/raft_server.go:500 +0x3a
created by coordinator.(*RaftServer).Serve
/home/vagrant/influxdb/src/coordinator/raft_server.go:504 +0x519

goroutine 13 [syscall]:
github.com/jmhodges/levigo._Cfunc_leveldb_open(0x1ff32b0, 0x1ff43a0, 0xc210111238, 0xc2100a3d60)
github.com/jmhodges/levigo/_obj/_cgo_defun.c:278 +0x31
github.com/jmhodges/levigo.Open(0xc2100a6f00, 0x2b, 0xc210000020, 0x0, 0x0, ...)
/home/vagrant/influxdb/src/github.com/jmhodges/levigo/db.go:79 +0xb6
datastore.(*LevelDbShardDatastore).GetOrCreateShard(0xc2100722a0, 0x1, 0x0, 0x0, 0x0, ...)
/home/vagrant/influxdb/src/datastore/leveldb_shard_datastore.go:123 +0x2d2
cluster.(*ShardData).SetLocalStore(0xc21006bb60, 0x7f3a8ac78e20, 0xc2100722a0, 0x1, 0x0, ...)
/home/vagrant/influxdb/src/cluster/shard.go:163 +0x10e
cluster.(*ClusterConfiguration).AddShards(0xc210078380, 0xc2100a5b00, 0x1, 0x4, 0x0, ...)
/home/vagrant/influxdb/src/cluster/cluster_configuration.go:824 +0x9bc
coordinator.(*CreateShardsCommand).Apply(0xc2100a5a40, 0x7f3a8ac7a240, 0xc2100a0240, 0x7f3a8ac7abe0, 0xc2100a5a40, ...)
/home/vagrant/influxdb/src/coordinator/command.go:242 +0x92
github.com/goraft/raft.func·005(0xc2100467e0, 0x7f3a8ac78650, 0xc2100a5a40, 0x76, 0x76, ...)
/home/vagrant/influxdb/src/github.com/goraft/raft/server.go:204 +0x364
github.com/goraft/raft.(*Log).setCommitIndex(0xc2100f5690, 0x9, 0x0, 0x0)
/home/vagrant/influxdb/src/github.com/goraft/raft/log.go:371 +0x36e
github.com/goraft/raft.(*server).processCommand(0xc2100a0240, 0x7f3a8ac7a690, 0xc2100a3b10, 0xc2100a67b0)
/home/vagrant/influxdb/src/github.com/goraft/raft/server.go:877 +0x47e
github.com/goraft/raft.(*server).leaderLoop(0xc2100a0240)
/home/vagrant/influxdb/src/github.com/goraft/raft/server.go:800 +0x474
github.com/goraft/raft.(*server).loop(0xc2100a0240)
/home/vagrant/influxdb/src/github.com/goraft/raft/server.go:590 +0x33f
created by github.com/goraft/raft.(*server).Start
/home/vagrant/influxdb/src/github.com/goraft/raft/server.go:460 +0x345

goroutine 14 [select]:
coordinator.(*RaftServer).CompactLog(0xc210073000)
/home/vagrant/influxdb/src/coordinator/raft_server.go:300 +0x2ef
created by coordinator.(*RaftServer).startRaft
/home/vagrant/influxdb/src/coordinator/raft_server.go:338 +0x388

goroutine 15 [select]:
coordinator.(*RaftServer).raftLeaderLoop(0xc210073000, 0xc2100a7740)
/home/vagrant/influxdb/src/coordinator/raft_server.go:407 +0x29c
created by coordinator.(*RaftServer).raftEventHandler
/home/vagrant/influxdb/src/coordinator/raft_server.go:396 +0x1d0

goroutine 16 [chan receive]:
github.com/goraft/raft.(*server).Do(0xc2100a0240, 0x7f3a8ac7a690, 0xc2100a3b10, 0x7f3a8ac7a690, 0xc2100a3b10, ...)
/home/vagrant/influxdb/src/github.com/goraft/raft/server.go:852 +0xfd
created by github.com/goraft/raft.(*server).leaderLoop
/home/vagrant/influxdb/src/github.com/goraft/raft/server.go:782 +0x220

goroutine 18 [finalizer wait]:
runtime.park(0x44fbf0, 0x1018da8, 0x10037c8)
/home/vagrant/bin/go/src/pkg/runtime/proc.c:1342 +0x66
runfinq()
/home/vagrant/bin/go/src/pkg/runtime/mgc0.c:2279 +0x84
runtime.goexit()
/home/vagrant/bin/go/src/pkg/runtime/proc.c:1394

@pauldix
Copy link
Member

pauldix commented Mar 28, 2014

Hey @samuraraujo, is it possible for you to zip up your data directory and post it somewhere for us to test with?

@samuraraujo
Copy link
Author

Hi Paul, I deleted the data directory to be able to start influxdb again. If it happens again I will send you the zip file.

@pauldix
Copy link
Member

pauldix commented Mar 28, 2014

What version are you running? Can you post a gist to your config file?

@samuraraujo
Copy link
Author

$ influxdb -v
InfluxDB v0.5.0 (git: a11a11e)

I did not change anything in the config file from the default ubuntu deb installation.

I noticed that the default log config is in "debug" mode. Maybe the default installation should use "error". The current config makes the log files grow very fast with large data.

@pauldix
Copy link
Member

pauldix commented Mar 28, 2014

Yeah, should probably be "info" or "warn". Also, 0.5.0 isn't the latest version. Can you upgrade to the new one?

@samuraraujo
Copy link
Author

Updated!
$ influxdb -v
InfluxDB v0.5.1 (git: b10dfb5a9366f134e83b0d7cb436474110cc50b1)

@toddboom
Copy link
Contributor

@samuraraujo is this still a current issue, or can it be closed out?

@wladekb
Copy link

wladekb commented May 5, 2014

I'm getting a similar error using the following version:
InfluxDB v0.5.3 (git: 767ba83)
using the default configuration file.

The server was rebooted (influxdb process has probably been killed) and afterwards it continuously crashes when I try to start it up.

I'm gonna do a backup of the data directory (11gb atm) and try to upgrade to 0.6.0 and check if the problem persists.

Logs:

+---------------------------------------------+
|  _____        __ _            _____  ____   |
| |_   _|      / _| |          |  __ \|  _ \  |
|   | |  _ __ | |_| |_   ___  _| |  | | |_) | |
|   | | | '_ \|  _| | | | \ \/ / |  | |  _ <  |
|  _| |_| | | | | | | |_| |>  <| |__| | |_) | |
| |_____|_| |_|_| |_|\__,_/_/\_\_____/|____/  |
+---------------------------------------------+


[2014/05/05 18:05:32 UTC] [INFO] (server.NewServer:33) Opening database at /opt/influxdb/shared/data/db
[2014/05/05 18:05:32 UTC] [INFO] (wal.NewWAL:40) Opening wal in /opt/influxdb/shared/data/wal
[2014/05/05 18:05:32 UTC] [INFO] (wal.(*WAL).openLog:358) Opening log file /opt/influxdb/shared/data/wal/log.38100001
[2014/05/05 18:05:32 UTC] [INFO] (wal.(*WAL).openLog:372) Opening index file /opt/influxdb/shared/data/wal/index.38100001
[2014/05/05 18:05:32 UTC] [INFO] (api/http.(*HttpServer).EnableSsl:55) Ssl will be disabled since the ssl port or certificate path weren't set
[2014/05/05 18:05:32 UTC] [INFO] (coordinator.(*RaftServer).Serve:486) Initializing Raft HTTP server
[2014/05/05 18:05:32 UTC] [INFO] (coordinator.(*ProtobufServer).ListenAndServe:60) ProtobufServer listening on 0.0.0.0:8099
[2014/05/05 18:05:32 UTC] [INFO] (coordinator.(*RaftServer).Serve:497) Raft Server Listening at http://dbstore-s1:8090
[2014/05/05 18:05:32 UTC] [INFO] (coordinator.(*RaftServer).startRaft:320) Initializing Raft Server: /opt/influxdb/shared/data/raft 8090
[2014/05/05 18:05:32 UTC] [INFO] (cluster.(*ClusterConfiguration).Recovery:481) Recovering the cluster configuration
[2014/05/05 18:05:32 UTC] [INFO] (datastore.(*LevelDbShardDatastore).GetOrCreateShard:122) DATASTORE: opening or creating shard /opt/influxdb/shared/data/db/shard_db/00005
[2014/05/05 18:05:32 UTC] [INFO] (datastore.(*LevelDbShardDatastore).GetOrCreateShard:122) DATASTORE: opening or creating shard /opt/influxdb/shared/data/db/shard_db/00004
[2014/05/05 18:05:32 UTC] [INFO] (datastore.(*LevelDbShardDatastore).GetOrCreateShard:122) DATASTORE: opening or creating shard /opt/influxdb/shared/data/db/shard_db/00003
[2014/05/05 18:05:32 UTC] [INFO] (datastore.(*LevelDbShardDatastore).GetOrCreateShard:122) DATASTORE: opening or creating shard /opt/influxdb/shared/data/db/shard_db/00002
[2014/05/05 18:05:32 UTC] [INFO] (datastore.(*LevelDbShardDatastore).GetOrCreateShard:122) DATASTORE: opening or creating shard /opt/influxdb/shared/data/db/shard_db/00001
[2014/05/05 18:05:32 UTC] [INFO] (coordinator.(*RaftServer).startRaft:341) Recovered from log
[2014/05/05 18:05:32 UTC] [INFO] (server.(*Server).ListenAndServe:85) Waiting for local server to be added
[2014/05/05 18:05:32 UTC] [INFO] (wal.(*WAL).SetServerId:109) Setting server id to 1 and recovering
[2014/05/05 18:05:32 UTC] [INFO] (wal.(*WAL).recover:429) Checking /opt/influxdb/shared/data/wal/log.38100001, last: 2536131, size: 2768896
panic: Replay error. Stacktrace:
goroutine 17 [running]:
common.NewErrorWithStacktrace(0x7f569b74ad58, 0xc210178040, 0xc210178050, 0x1, 0x1, ...)
    /home/vagrant/influxdb/src/common/error_with_stacktrace.go:22 +0x7f
wal.newErrorReplayRequest(0x7f569b74ad58, 0xc210178040, 0x0)
    /home/vagrant/influxdb/src/wal/replay_request.go:19 +0xc0
wal.(*log).replayFromFileLocation(0xc2100fb120, 0xc2101362a8, 0xc2101309c0, 0xc21012b8f0, 0xc21011fcc0)
    /home/vagrant/influxdb/src/wal/log.go:254 +0x7ea
wal.func·002()
    /home/vagrant/influxdb/src/wal/log.go:133 +0x25b
created by wal.(*log).dupAndReplayFromOffset
    /home/vagrant/influxdb/src/wal/log.go:134 +0x16c

Caused by: proto: required field "{Unknown}" not set

goroutine 1 [running]:
runtime.panic(0x857fa0, 0xc2100fb780)
    /home/vagrant/bin/go/src/pkg/runtime/panic.c:266 +0xb6
wal.(*WAL).SetServerId(0xc210078000, 0xc200000001)
    /home/vagrant/influxdb/src/wal/wal.go:113 +0x122
server.(*Server).ListenAndServe(0xc2100c5930, 0xc2100c5930, 0x0)
    /home/vagrant/influxdb/src/server/server.go:87 +0x10d
main.main()
    /home/vagrant/influxdb/src/daemon/influxd.go:119 +0x5fe

goroutine 3 [syscall]:
os/signal.loop()
    /home/vagrant/bin/go/src/pkg/os/signal/signal_unix.go:21 +0x1e
created by os/signal.init·1
    /home/vagrant/bin/go/src/pkg/os/signal/signal_unix.go:27 +0x31

goroutine 4 [chan receive]:
code.google.com/p/log4go.ConsoleLogWriter.run(0xc21000b160, 0x7f569b73e110, 0xc210000008)
    /home/vagrant/influxdb/src/code.google.com/p/log4go/termlog.go:27 +0x60
created by code.google.com/p/log4go.NewConsoleLogWriter
    /home/vagrant/influxdb/src/code.google.com/p/log4go/termlog.go:19 +0x67

goroutine 5 [runnable]:
time.absDate(0x7ffffffe6e419bec, 0xf43fd01, 0x101cc20, 0x7ffffffe6e419bec, 0x11009b840, ...)
    /home/vagrant/bin/go/src/pkg/time/time.go:681
time.Time.date(0xecaf9c9ec, 0xf43fdb7, 0x101cc20, 0x5367d201, 0xf43fdb7, ...)
    /home/vagrant/bin/go/src/pkg/time/time.go:677 +0x58
time.Time.Day(0xecaf9c9ec, 0xf43fdb7, 0x101cc20, 0x7f569b5b6e9f)
    /home/vagrant/bin/go/src/pkg/time/time.go:311 +0x40
code.google.com/p/log4go.func·002()
    /home/vagrant/influxdb/src/code.google.com/p/log4go/filelog.go:97 +0x81c
created by code.google.com/p/log4go.NewFileLogWriter
    /home/vagrant/influxdb/src/code.google.com/p/log4go/filelog.go:116 +0x2d1

goroutine 6 [syscall]:
runtime.goexit()
    /home/vagrant/bin/go/src/pkg/runtime/proc.c:1394

goroutine 7 [finalizer wait]:
runtime.park(0x450310, 0x101af68, 0x1005988)
    /home/vagrant/bin/go/src/pkg/runtime/proc.c:1342 +0x66
runfinq()
    /home/vagrant/bin/go/src/pkg/runtime/mgc0.c:2279 +0x84
runtime.goexit()
    /home/vagrant/bin/go/src/pkg/runtime/proc.c:1394

goroutine 8 [chan receive]:
wal.(*WAL).processEntries(0xc210078000)
    /home/vagrant/influxdb/src/wal/wal.go:242 +0x3f
created by wal.NewWAL
    /home/vagrant/influxdb/src/wal/wal.go:103 +0x9f3

goroutine 9 [sleep]:
time.Sleep(0x8bb2c97000)
    /tmp/makerelease886106415/go/src/pkg/runtime/time.goc:31 +0x31
cluster.func·001()
    /home/vagrant/influxdb/src/cluster/cluster_configuration.go:131 +0x35
created by cluster.(*ClusterConfiguration).CreateFutureShardsAutomaticallyBeforeTimeComes
    /home/vagrant/influxdb/src/cluster/cluster_configuration.go:136 +0x63

goroutine 11 [chan receive]:
main.waitForSignals(0x7f569b740040, 0xc2100c5930)
    /home/vagrant/influxdb/src/daemon/null_profiler.go:23 +0x126
created by main.startProfiler
    /home/vagrant/influxdb/src/daemon/null_profiler.go:15 +0x38

goroutine 12 [IO wait]:
net.runtime_pollWait(0x7f569b740fb8, 0x72, 0x0)
    /tmp/makerelease886106415/go/src/pkg/runtime/netpoll.goc:116 +0x6a
net.(*pollDesc).Wait(0xc210077060, 0x72, 0x7f569b73df88, 0xb)
    /home/vagrant/bin/go/src/pkg/net/fd_poll_runtime.go:81 +0x34
net.(*pollDesc).WaitRead(0xc210077060, 0xb, 0x7f569b73df88)
    /home/vagrant/bin/go/src/pkg/net/fd_poll_runtime.go:86 +0x30
net.(*netFD).accept(0xc210077000, 0x9f6030, 0x0, 0x7f569b73df88, 0xb)
    /home/vagrant/bin/go/src/pkg/net/fd_unix.go:382 +0x2c2
net.(*TCPListener).AcceptTCP(0xc210000078, 0xc21009c020, 0x0, 0x7f569b740090)
    /home/vagrant/bin/go/src/pkg/net/tcpsock_posix.go:233 +0x47
net.(*TCPListener).Accept(0xc210000078, 0xc21009c020, 0x7f5698668f38, 0x1, 0x1)
    /home/vagrant/bin/go/src/pkg/net/tcpsock_posix.go:243 +0x27
coordinator.(*ProtobufServer).ListenAndServe(0xc2100bb880)
    /home/vagrant/influxdb/src/coordinator/protobuf_server.go:62 +0x1c7
created by server.(*Server).ListenAndServe
    /home/vagrant/influxdb/src/server/server.go:78 +0x3d

goroutine 13 [IO wait]:
net.runtime_pollWait(0x7f569b741060, 0x72, 0x0)
    /tmp/makerelease886106415/go/src/pkg/runtime/netpoll.goc:116 +0x6a
net.(*pollDesc).Wait(0xc2100c5a00, 0x72, 0x7f569b73df88, 0xb)
    /home/vagrant/bin/go/src/pkg/net/fd_poll_runtime.go:81 +0x34
net.(*pollDesc).WaitRead(0xc2100c5a00, 0xb, 0x7f569b73df88)
    /home/vagrant/bin/go/src/pkg/net/fd_poll_runtime.go:86 +0x30
net.(*netFD).accept(0xc2100c59a0, 0x9f6030, 0x0, 0x7f569b73df88, 0xb)
    /home/vagrant/bin/go/src/pkg/net/fd_unix.go:382 +0x2c2
net.(*TCPListener).AcceptTCP(0xc2100c6518, 0x18, 0xc210107810, 0x5c7bc3)
    /home/vagrant/bin/go/src/pkg/net/tcpsock_posix.go:233 +0x47
net.(*TCPListener).Accept(0xc2100c6518, 0x0, 0x0, 0x0, 0x0)
    /home/vagrant/bin/go/src/pkg/net/tcpsock_posix.go:243 +0x27
net/http.(*Server).Serve(0xc2100c81e0, 0x7f569b7400c0, 0xc2100c6518, 0x0, 0x0)
    /home/vagrant/bin/go/src/pkg/net/http/server.go:1622 +0x91
coordinator.func·008()
    /home/vagrant/influxdb/src/coordinator/raft_server.go:500 +0x3a
created by coordinator.(*RaftServer).Serve
    /home/vagrant/influxdb/src/coordinator/raft_server.go:504 +0x519

goroutine 15 [select]:
github.com/goraft/raft.(*server).followerLoop(0xc2100bc240)
    /home/vagrant/influxdb/src/github.com/goraft/raft/server.go:613 +0x934
github.com/goraft/raft.(*server).loop(0xc2100bc240)
    /home/vagrant/influxdb/src/github.com/goraft/raft/server.go:564 +0x2e9
created by github.com/goraft/raft.(*server).Start
    /home/vagrant/influxdb/src/github.com/goraft/raft/server.go:472 +0x7af

goroutine 16 [select]:
coordinator.(*RaftServer).CompactLog(0xc2100da0c0)
    /home/vagrant/influxdb/src/coordinator/raft_server.go:300 +0x2ef
created by coordinator.(*RaftServer).startRaft
    /home/vagrant/influxdb/src/coordinator/raft_server.go:338 +0x38f

@jvshahid
Copy link
Contributor

jvshahid commented May 5, 2014

@wladekb can you zip your data and send it to support at influxdb dot com

@wladekb
Copy link

wladekb commented May 5, 2014

@jvshahid do you really want me to send you 11GB via email?

@jvshahid
Copy link
Contributor

jvshahid commented May 5, 2014

I'm only interested in the WAL, especially log.38100001. How big is it?

@wladekb
Copy link

wladekb commented May 5, 2014

@jvshahid I sent WAL and a few other files, did you get it?

@wladekb
Copy link

wladekb commented May 5, 2014

Issue is still valid after upgrading to 0.6.0

[2014/05/05 22:45:42 UTC] [INFO] (main.setupLogging:53) Redirectoring logging to /opt/influxdb/shared/log.txt
[2014/05/05 22:45:42 UTC] [INFO] (main.main:117) Starting Influx Server bound to 0.0.0.0 ...
[2014/05/05 22:45:42 UTC] [INFO] (server.NewServer:35) Opening database at /opt/influxdb/shared/data/db
[2014/05/05 22:45:42 UTC] [INFO] (wal.NewWAL:40) Opening wal in /opt/influxdb/shared/data/wal
[2014/05/05 22:45:42 UTC] [INFO] (wal.(*WAL).openLog:360) Opening log file /opt/influxdb/shared/data/wal/log.38100001
[2014/05/05 22:45:42 UTC] [INFO] (wal.(*WAL).openLog:374) Opening index file /opt/influxdb/shared/data/wal/index.38100001
[2014/05/05 22:45:42 UTC] [INFO] (api/http.(*HttpServer).EnableSsl:62) Ssl will be disabled since the ssl port or certificate path weren't set
[2014/05/05 22:45:42 UTC] [INFO] (coordinator.(*RaftServer).Serve:516) Initializing Raft HTTP server
[2014/05/05 22:45:42 UTC] [INFO] (coordinator.(*RaftServer).Serve:527) Raft Server Listening at 0.0.0.0:8090
[2014/05/05 22:45:42 UTC] [INFO] (coordinator.(*RaftServer).startRaft:356) Initializing Raft Server: http://dbstore-s1:8090
[2014/05/05 22:45:42 UTC] [INFO] (cluster.(*ClusterConfiguration).Recovery:535) Recovering the cluster configuration
[2014/05/05 22:45:42 UTC] [INFO] (datastore.(*LevelDbShardDatastore).GetOrCreateShard:123) DATASTORE: opening or creating shard /opt/influxdb/shared/data/db/shard_db/00005
[2014/05/05 22:45:42 UTC] [INFO] (datastore.(*LevelDbShardDatastore).GetOrCreateShard:123) DATASTORE: opening or creating shard /opt/influxdb/shared/data/db/shard_db/00004
[2014/05/05 22:45:42 UTC] [INFO] (datastore.(*LevelDbShardDatastore).GetOrCreateShard:123) DATASTORE: opening or creating shard /opt/influxdb/shared/data/db/shard_db/00003
[2014/05/05 22:45:42 UTC] [INFO] (datastore.(*LevelDbShardDatastore).GetOrCreateShard:123) DATASTORE: opening or creating shard /opt/influxdb/shared/data/db/shard_db/00002
[2014/05/05 22:45:42 UTC] [INFO] (datastore.(*LevelDbShardDatastore).GetOrCreateShard:123) DATASTORE: opening or creating shard /opt/influxdb/shared/data/db/shard_db/00001
[2014/05/05 22:45:42 UTC] [INFO] (coordinator.(*RaftServer).startRaft:377) Recovered from log
[2014/05/05 22:45:42 UTC] [INFO] (server.(*Server).ListenAndServe:87) Waiting for local server to be added
[2014/05/05 22:45:42 UTC] [INFO] (wal.(*WAL).SetServerId:109) Setting server id to 1 and recovering
[2014/05/05 22:45:42 UTC] [INFO] (wal.(*WAL).recover:431) Checking /opt/influxdb/shared/data/wal/log.38100001, last: 2536131, size: 2768896
panic: Replay error. Stacktrace:
goroutine 16 [running]:
common.NewErrorWithStacktrace(0x7f7fc4ea5848, 0xc2101b7540, 0xc2101b7550, 0x1, 0x1, ...)
        /home/vagrant/influxdb/src/common/error_with_stacktrace.go:22 +0x7f
wal.newErrorReplayRequest(0x7f7fc4ea5848, 0xc2101b7540, 0x0)
        /home/vagrant/influxdb/src/wal/replay_request.go:19 +0xc0
wal.(*log).replayFromFileLocation(0xc2100d4c30, 0xc210122028, 0xc2101200c0, 0xc2100d5210, 0xc210121060)
        /home/vagrant/influxdb/src/wal/log.go:254 +0x7ea
wal.func·002()
        /home/vagrant/influxdb/src/wal/log.go:133 +0x25b
created by wal.(*log).dupAndReplayFromOffset
        /home/vagrant/influxdb/src/wal/log.go:134 +0x16c

Caused by: proto: required field "{Unknown}" not set

goroutine 1 [running]:
runtime.panic(0x85ed00, 0xc2100d4fc0)
        /home/vagrant/bin/go/src/pkg/runtime/panic.c:266 +0xb6
wal.(*WAL).SetServerId(0xc210078d00, 0xc200000001)
        /home/vagrant/influxdb/src/wal/wal.go:113 +0x122
server.(*Server).ListenAndServe(0xc2100a9770, 0xc2100a9770, 0x0)
        /home/vagrant/influxdb/src/server/server.go:89 +0xf2
main.main()
        /home/vagrant/influxdb/src/daemon/influxd.go:155 +0xb97

goroutine 3 [syscall]:
os/signal.loop()
        /home/vagrant/bin/go/src/pkg/os/signal/signal_unix.go:21 +0x1e
created by os/signal.init·1
        /home/vagrant/bin/go/src/pkg/os/signal/signal_unix.go:27 +0x31

goroutine 4 [chan receive]:
code.google.com/p/log4go.ConsoleLogWriter.run(0xc210071000, 0x7f7fc4e99110, 0xc210000008)
        /home/vagrant/influxdb/src/code.google.com/p/log4go/termlog.go:27 +0x60
created by code.google.com/p/log4go.NewConsoleLogWriter
        /home/vagrant/influxdb/src/code.google.com/p/log4go/termlog.go:19 +0x67

goroutine 5 [runnable]:
code.google.com/p/log4go.FormatLogRecord(0x9500f0, 0x14, 0xc210176c80, 0x5, 0x1)
        /home/vagrant/influxdb/src/code.google.com/p/log4go/pattlog.go:43 +0xf3
code.google.com/p/log4go.func·002()
        /home/vagrant/influxdb/src/code.google.com/p/log4go/filelog.go:105 +0x54b
created by code.google.com/p/log4go.NewFileLogWriter
        /home/vagrant/influxdb/src/code.google.com/p/log4go/filelog.go:116 +0x2d1

goroutine 6 [syscall]:
runtime.goexit()
        /home/vagrant/bin/go/src/pkg/runtime/proc.c:1394

goroutine 7 [chan receive]:
wal.(*WAL).processEntries(0xc210078d00)
        /home/vagrant/influxdb/src/wal/wal.go:242 +0x3f
created by wal.NewWAL
        /home/vagrant/influxdb/src/wal/wal.go:103 +0x9f3

goroutine 8 [sleep]:
time.Sleep(0x8bb2c97000)
        /tmp/makerelease886106415/go/src/pkg/runtime/time.goc:31 +0x31
cluster.func·001()
        /home/vagrant/influxdb/src/cluster/cluster_configuration.go:132 +0x35
created by cluster.(*ClusterConfiguration).CreateFutureShardsAutomaticallyBeforeTimeComes
        /home/vagrant/influxdb/src/cluster/cluster_configuration.go:137 +0x63

goroutine 10 [chan receive]:
main.waitForSignals(0x7f7fc4e9a250, 0xc2100a9770)
        /home/vagrant/influxdb/src/daemon/null_profiler.go:23 +0x126
created by main.startProfiler
        /home/vagrant/influxdb/src/daemon/null_profiler.go:15 +0x38

goroutine 11 [finalizer wait]:
runtime.park(0x451590, 0x10239f8, 0x100e428)
        /home/vagrant/bin/go/src/pkg/runtime/proc.c:1342 +0x66
runfinq()
        /home/vagrant/bin/go/src/pkg/runtime/mgc0.c:2279 +0x84
runtime.goexit()
        /home/vagrant/bin/go/src/pkg/runtime/proc.c:1394

goroutine 12 [IO wait]:
net.runtime_pollWait(0x7f7fc4e9c270, 0x72, 0x0)
        /tmp/makerelease886106415/go/src/pkg/runtime/netpoll.goc:116 +0x6a
net.(*pollDesc).Wait(0xc2100bc3e0, 0x72, 0x7f7fc4e98f88, 0xb)
        /home/vagrant/bin/go/src/pkg/net/fd_poll_runtime.go:81 +0x34
net.(*pollDesc).WaitRead(0xc2100bc3e0, 0xb, 0x7f7fc4e98f88)
        /home/vagrant/bin/go/src/pkg/net/fd_poll_runtime.go:86 +0x30
net.(*netFD).accept(0xc2100bc380, 0x9fcb20, 0x0, 0x7f7fc4e98f88, 0xb)
        /home/vagrant/bin/go/src/pkg/net/fd_unix.go:382 +0x2c2
net.(*TCPListener).AcceptTCP(0xc210000068, 0x18, 0xc2100d3810, 0x5cb0f3)
        /home/vagrant/bin/go/src/pkg/net/tcpsock_posix.go:233 +0x47
net.(*TCPListener).Accept(0xc210000068, 0x0, 0x0, 0x0, 0x0)
        /home/vagrant/bin/go/src/pkg/net/tcpsock_posix.go:243 +0x27
net/http.(*Server).Serve(0xc2100be050, 0x7f7fc4e9b2d0, 0xc210000068, 0x0, 0x0)
        /home/vagrant/bin/go/src/pkg/net/http/server.go:1622 +0x91
coordinator.func·007()
        /home/vagrant/influxdb/src/coordinator/raft_server.go:530 +0x3a
created by coordinator.(*RaftServer).Serve
        /home/vagrant/influxdb/src/coordinator/raft_server.go:534 +0x4d9

goroutine 14 [select]:
github.com/goraft/raft.(*server).followerLoop(0xc2100597e0)
        /home/vagrant/influxdb/src/github.com/goraft/raft/server.go:613 +0x934
github.com/goraft/raft.(*server).loop(0xc2100597e0)
        /home/vagrant/influxdb/src/github.com/goraft/raft/server.go:564 +0x2e9
created by github.com/goraft/raft.(*server).Start
        /home/vagrant/influxdb/src/github.com/goraft/raft/server.go:472 +0x7af

goroutine 15 [select]:
coordinator.(*RaftServer).CompactLog(0xc2100d5a50)
        /home/vagrant/influxdb/src/coordinator/raft_server.go:320 +0x2ef
created by coordinator.(*RaftServer).startRaft
        /home/vagrant/influxdb/src/coordinator/raft_server.go:374 +0x375

@jvshahid
Copy link
Contributor

jvshahid commented May 6, 2014

@wladekb I didn't get the data, who did you send it to ?

@wladekb
Copy link

wladekb commented May 6, 2014

@jvshahid I sent it to support at influxdb dot com with subject "Issue 369 data dir"

@jvshahid
Copy link
Contributor

jvshahid commented May 6, 2014

How big was the file? None of us got the email. Is it possible to put it on S3 or Dropbox?

@wladekb
Copy link

wladekb commented May 6, 2014

18 MB, zipped with a password (I had to do it due to Gmail's security policy)

@jvshahid
Copy link
Contributor

jvshahid commented May 6, 2014

Well, we didn't get the email. Can you use Google Drive, S3, or Dropbox? Any of those should be fine with an 18 MB file.

@wladekb
Copy link

wladekb commented May 6, 2014

@jvshahid
Copy link
Contributor

jvshahid commented May 6, 2014

Thanks, I have it now. I'll take a look asap and get back to you.

@wladekb
Copy link

wladekb commented May 6, 2014

FYI I stripped all non-most-recent data files from archive. If any of them are needed I still have a copy.

@jvshahid
Copy link
Contributor

jvshahid commented May 6, 2014

@wladekb can you run ls -l on the wal directory and paste the output here? Also, what kind of file system are you using? It seems like extra 0 bytes were added at the end of the file to make its size a multiple of 4K. Not sure if this is something the fs is doing or InfluxDB is doing.

@wladekb
Copy link

wladekb commented May 7, 2014

root@dbstore-s1:/opt/influxdb/shared/data/wal# ls -l
total 2712
-rw-r--r-- 1 root root     306 May  1 00:14 bookmark
-rw-r--r-- 1 root root     164 May  1 00:14 index.38100001
-rw-r--r-- 1 root root 2768896 May  1 00:15 log.38100001
root@dbstore-s1:/opt/influxdb/shared/data/wal# cat /etc/issue
Ubuntu 12.04.2 LTS \n \l

root@dbstore-s1:/opt/influxdb/shared/data/wal# uname -a
Linux dbstore-s1 3.8.0-26-generic #38~precise2-Ubuntu SMP Thu Jun 20 18:29:36 UTC 2013 x86_64 x86_64 x86_64 GNU/Linux
root@dbstore-s1:/opt/influxdb/shared/data/wal# mount
/dev/sdb2 on / type ext4 (rw,errors=remount-ro)
[...snip...]

btw. it's a physical machine

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment
Labels
None yet
Projects
None yet
Development

No branches or pull requests

5 participants