Merge pull request #4235 from renzhengeek/renzhen/fix-iohang
snapshots/devmapper: fix race window causing IO hangup
This commit is contained in:
commit
80859e8fd8
@ -347,6 +347,16 @@ func (p *PoolDevice) SuspendDevice(ctx context.Context, deviceName string) error
|
|||||||
return nil
|
return nil
|
||||||
}
|
}
|
||||||
|
|
||||||
|
func (p *PoolDevice) ResumeDevice(ctx context.Context, deviceName string) error {
|
||||||
|
if err := p.transition(ctx, deviceName, Resuming, Resumed, func() error {
|
||||||
|
return dmsetup.ResumeDevice(deviceName)
|
||||||
|
}); err != nil {
|
||||||
|
return errors.Wrapf(err, "failed to resume device %q", deviceName)
|
||||||
|
}
|
||||||
|
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
|
||||||
// DeactivateDevice deactivates thin device
|
// DeactivateDevice deactivates thin device
|
||||||
func (p *PoolDevice) DeactivateDevice(ctx context.Context, deviceName string, deferred, withForce bool) error {
|
func (p *PoolDevice) DeactivateDevice(ctx context.Context, deviceName string, deferred, withForce bool) error {
|
||||||
if !p.IsLoaded(deviceName) {
|
if !p.IsLoaded(deviceName) {
|
||||||
|
@ -277,14 +277,26 @@ func (s *Snapshotter) Commit(ctx context.Context, name, key string, opts ...snap
|
|||||||
return err
|
return err
|
||||||
}
|
}
|
||||||
|
|
||||||
// The thin snapshot is not used for IO after committed, so
|
// After committed, the snapshot device will not be directly
|
||||||
// suspend to flush the IO and deactivate the device.
|
// used anymore. We'd better deactivate it to make it *invisible*
|
||||||
|
// in userspace, so that tools like LVM2 and fdisk cannot touch it,
|
||||||
|
// and avoid useless IOs on it.
|
||||||
|
//
|
||||||
|
// Before deactivation, we need to flush the outstanding IO by suspend.
|
||||||
|
// Afterward, we resume it again to prevent a race window which may cause
|
||||||
|
// a process IO hang. See the issue below for details:
|
||||||
|
// (https://github.com/containerd/containerd/issues/4234)
|
||||||
err = s.pool.SuspendDevice(ctx, deviceName)
|
err = s.pool.SuspendDevice(ctx, deviceName)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
return err
|
return err
|
||||||
}
|
}
|
||||||
|
|
||||||
return s.pool.DeactivateDevice(ctx, deviceName, true, false)
|
err = s.pool.ResumeDevice(ctx, deviceName)
|
||||||
|
if err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
|
||||||
|
return s.pool.DeactivateDevice(ctx, deviceName, false, false)
|
||||||
})
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user