It’s doing it again! Everytime I start the service on this particular machine (4 processes), at least one or two processes complain about Must be unbuffered
. I tried stopping the service, removing all previous data, restarting, doing configure new single ssd
and everytime I restart the services, I get the same result.
The pattern I see is a StorageServerTerminated
event, followed by a bunch of CoroStop
, then a AllAlternativesFailed
and finally FileOpenError
/KVDoCloseError
. This time it’s on a .sqlite file.
v6.0.15, 4 processes on single machine, data split between two disks (C: and D:)
Config file:
[fdbmonitor]
restart_delay = 20
[general]
cluster_file=C:\ProgramData\foundationdb\fdb.cluster
[fdbserver]
public_address = auto:$ID
listen_address = public
parentpid = $PID
command=C:\Program Files\foundationdb\bin\fdbserver.exe
datadir=C:\ProgramData\foundationdb\data\$ID
logdir=C:\ProgramData\foundationdb\logs
[fdbserver.4500]
[fdbserver.4501]
[fdbserver.4502]
datadir=D:\foundationdb\data\$ID
[fdbserver.4503]
datadir=D:\foundationdb\data\$ID
[backup-agent]
command=C:\Program Files\foundationdb\bin\backup_agent.exe
logdir=C:\ProgramData\foundationdb\logs
[backup-agent.1]
Log extract:
...
<Event Severity="10" Time="1553945442.597377" Type="TLogJoinedMe" ID="c512472fafc50a3d" TLog="56659ccf2ca43a92" Address="10.0.1.26:4501" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.597377" Type="CoroStop" ID="0000000000000000" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.597377" Type="KVWriterDestroying" ID="b60c68f39e5a077c" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.597377" Type="KVWriterDestroyed" ID="b60c68f39e5a077c" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.600754" Type="KVClose" ID="d9a605321616b006" Del="1" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.600754" Type="WorkPool_Stop" ID="0000000000000000" Workers="1" Idle="1" Work="0" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.600754" Type="WorkPool_Stop" ID="0000000000000000" Workers="64" Idle="64" Work="0" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.600754" Type="StorageServerTerminated" ID="d9a605321616b006" Error="worker_removed" ErrorDescription="Normal worker shut down" ErrorCode="1202" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.605091" Type="CommitAttachID" ID="4ba4f4861037259a" To="8c45ffdb86141495" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.605091" Type="CommitDebug" ID="8c45ffdb86141495" Location="TLog.tLogCommit.BeforeWaitForVersion" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.605091" Type="CommitDebug" ID="8c45ffdb86141495" Location="TLog.tLogCommit.Before" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.605091" Type="CommitDebug" ID="8c45ffdb86141495" Location="TLog.tLogCommit.AfterTLogCommit" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.606858" Type="CommitDebug" ID="8c45ffdb86141495" Location="TLog.tLogCommit.After" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.606858" Type="CoroStop" ID="0000000000000000" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.606858" Type="CoroStop" ID="0000000000000000" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.606858" Type="CoroStop" ID="0000000000000000" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.606858" Type="CoroStop" ID="0000000000000000" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
... same event repeated 10 times....
<Event Severity="10" Time="1553945442.608516" Type="CoroStop" ID="0000000000000000" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.608516" Type="CoroStop" ID="0000000000000000" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.608782" Type="CodeCoverage" ID="0000000000000000" File="DiskQueue.actor.cpp" Line="655" Condition="contents.size() && pushedPageCount()" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.608782" Type="CoroStop" ID="0000000000000000" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
... removed 30+ times same event...
<Event Severity="10" Time="1553945442.609032" Type="CoroStop" ID="0000000000000000" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.609032" Type="CoroStop" ID="0000000000000000" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.609032" Type="CoroStop" ID="0000000000000000" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.609290" Type="AllAlternativesFailed" ID="0000000000000000" Interval="1" Alternatives="bebba47071638ebd" Delay="0.05" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="40" Time="1553945442.609290" Type="FileOpenError" ID="0000000000000000" Reason="Must be unbuffered" Flags="131074" File="D:\foundationdb\data\4503\storage-b60c68f39e5a077c0c974b6d0118c118.sqlite" Backtrace="" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="40" Time="1553945442.609290" Type="KVDoCloseError" ID="b60c68f39e5a077c" Error="io_error" ErrorDescription="Disk i/o operation failed" ErrorCode="1510" Reason="unknown" Backtrace="" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.609290" Type="KVClosed" ID="b60c68f39e5a077c" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.609290" Type="Role" ID="b60c68f39e5a077c" Error="success" ErrorDescription="Success" ErrorCode="0" Transition="End" As="StorageServer" Reason="Error" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" TrackLatestType="Original" />
<Event Severity="10" Time="1553945442.609290" Type="WorkPool_Stop" ID="0000000000000000" Workers="1" Idle="0" Work="0" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.609290" Type="WorkPool_Stop" ID="0000000000000000" Workers="64" Idle="0" Work="0" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.612864" Type="TransactionAttachID" ID="10188f69184bbdef" To="edd39d8b61f68931" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.612864" Type="TransactionDebug" ID="edd39d8b61f68931" Location="TLogServer.TLogConfirmRunningRequest" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.612864" Type="CoroStop" ID="0000000000000000" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.612864" Type="KVWriterDestroying" ID="d9a605321616b006" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.612864" Type="KVWriterDestroyed" ID="d9a605321616b006" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="40" Time="1553945442.616773" Type="FileOpenError" ID="0000000000000000" Reason="Must be unbuffered" Flags="131074" File="D:\foundationdb\data\4503\storage-d9a605321616b0064898aff70659a5a5.sqlite" Backtrace="" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="40" Time="1553945442.616773" Type="KVDoCloseError" ID="d9a605321616b006" Error="io_error" ErrorDescription="Disk i/o operation failed" ErrorCode="1510" Reason="unknown" Backtrace="" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.616773" Type="KVClosed" ID="d9a605321616b006" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.616773" Type="Role" ID="d9a605321616b006" Error="success" ErrorDescription="Success" ErrorCode="0" Transition="End" As="StorageServer" Reason="Error" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" TrackLatestType="Original" />
<Event Severity="10" Time="1553945442.616773" Type="WorkPool_Stop" ID="0000000000000000" Workers="1" Idle="0" Work="0" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.616773" Type="WorkPool_Stop" ID="0000000000000000" Workers="64" Idle="0" Work="0" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.618938" Type="SSTag" ID="ff08bffb954efca7" MyTag="0:2" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
<Event Severity="10" Time="1553945442.618938" Type="StorageServerStartingCore" ID="ff08bffb954efca7" TimeTaken="1.34955" Machine="10.0.1.26:4503" LogGroup="default" Roles="MS,SS,TL" />
...