|
|
@ -207,26 +207,13 @@ func shouldHealObjectOnDisk(xlErr, dataErr error, meta xlMetaV1, quorumModTime t |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
// Heals an object by re-writing corrupt/missing erasure blocks.
|
|
|
|
// Heals an object by re-writing corrupt/missing erasure blocks.
|
|
|
|
func healObject(ctx context.Context, storageDisks []StorageAPI, bucket string, object string, |
|
|
|
func (xl xlObjects) healObject(ctx context.Context, bucket string, object string, |
|
|
|
quorum int, dryRun bool, scanMode madmin.HealScanMode) (result madmin.HealResultItem, err error) { |
|
|
|
partsMetadata []xlMetaV1, errs []error, latestXLMeta xlMetaV1, |
|
|
|
|
|
|
|
dryRun bool, remove bool, scanMode madmin.HealScanMode) (result madmin.HealResultItem, err error) { |
|
|
|
|
|
|
|
|
|
|
|
partsMetadata, errs := readAllXLMetadata(ctx, storageDisks, bucket, object) |
|
|
|
dataBlocks := latestXLMeta.Erasure.DataBlocks |
|
|
|
|
|
|
|
|
|
|
|
errCount := 0 |
|
|
|
storageDisks := xl.getDisks() |
|
|
|
for _, err := range errs { |
|
|
|
|
|
|
|
if err != nil { |
|
|
|
|
|
|
|
errCount++ |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if errCount == len(errs) { |
|
|
|
|
|
|
|
// Only if we get errors from all the disks we return error. Else we need to
|
|
|
|
|
|
|
|
// continue to return filled madmin.HealResultItem struct which includes info
|
|
|
|
|
|
|
|
// on what disks the file is available etc.
|
|
|
|
|
|
|
|
if reducedErr := reduceReadQuorumErrs(ctx, errs, nil, quorum); reducedErr != nil { |
|
|
|
|
|
|
|
return defaultHealResult(storageDisks, errs, bucket, object), toObjectErr(reducedErr, bucket, object) |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
// List of disks having latest version of the object xl.json
|
|
|
|
// List of disks having latest version of the object xl.json
|
|
|
|
// (by modtime).
|
|
|
|
// (by modtime).
|
|
|
@ -237,10 +224,12 @@ func healObject(ctx context.Context, storageDisks []StorageAPI, bucket string, o |
|
|
|
|
|
|
|
|
|
|
|
// Initialize heal result object
|
|
|
|
// Initialize heal result object
|
|
|
|
result = madmin.HealResultItem{ |
|
|
|
result = madmin.HealResultItem{ |
|
|
|
Type: madmin.HealItemObject, |
|
|
|
Type: madmin.HealItemObject, |
|
|
|
Bucket: bucket, |
|
|
|
Bucket: bucket, |
|
|
|
Object: object, |
|
|
|
Object: object, |
|
|
|
DiskCount: len(storageDisks), |
|
|
|
DiskCount: len(storageDisks), |
|
|
|
|
|
|
|
ParityBlocks: latestXLMeta.Erasure.ParityBlocks, |
|
|
|
|
|
|
|
DataBlocks: latestXLMeta.Erasure.DataBlocks, |
|
|
|
|
|
|
|
|
|
|
|
// Initialize object size to -1, so we can detect if we are
|
|
|
|
// Initialize object size to -1, so we can detect if we are
|
|
|
|
// unable to reliably find the object size.
|
|
|
|
// unable to reliably find the object size.
|
|
|
@ -308,11 +297,18 @@ func healObject(ctx context.Context, storageDisks []StorageAPI, bucket string, o |
|
|
|
|
|
|
|
|
|
|
|
// If less than read quorum number of disks have all the parts
|
|
|
|
// If less than read quorum number of disks have all the parts
|
|
|
|
// of the data, we can't reconstruct the erasure-coded data.
|
|
|
|
// of the data, we can't reconstruct the erasure-coded data.
|
|
|
|
if numAvailableDisks < quorum { |
|
|
|
if numAvailableDisks < dataBlocks { |
|
|
|
// Default to most common configuration for erasure
|
|
|
|
// Check if xl.json, and corresponding parts are also missing.
|
|
|
|
// blocks upon returning quorum error.
|
|
|
|
if m, ok := isObjectDangling(partsMetadata, errs, dataErrs); ok { |
|
|
|
result.ParityBlocks = len(storageDisks) / 2 |
|
|
|
writeQuorum := m.Erasure.DataBlocks + 1 |
|
|
|
result.DataBlocks = len(storageDisks) / 2 |
|
|
|
if m.Erasure.DataBlocks == 0 { |
|
|
|
|
|
|
|
writeQuorum = len(storageDisks)/2 + 1 |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
if !dryRun && remove { |
|
|
|
|
|
|
|
err = xl.deleteObject(ctx, bucket, object, writeQuorum, false) |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
return defaultHealResult(latestXLMeta, storageDisks, errs, bucket, object), err |
|
|
|
|
|
|
|
} |
|
|
|
return result, toObjectErr(errXLReadQuorum, bucket, object) |
|
|
|
return result, toObjectErr(errXLReadQuorum, bucket, object) |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
@ -329,7 +325,7 @@ func healObject(ctx context.Context, storageDisks []StorageAPI, bucket string, o |
|
|
|
|
|
|
|
|
|
|
|
// Latest xlMetaV1 for reference. If a valid metadata is not
|
|
|
|
// Latest xlMetaV1 for reference. If a valid metadata is not
|
|
|
|
// present, it is as good as object not found.
|
|
|
|
// present, it is as good as object not found.
|
|
|
|
latestMeta, pErr := pickValidXLMeta(ctx, partsMetadata, modTime, quorum) |
|
|
|
latestMeta, pErr := pickValidXLMeta(ctx, partsMetadata, modTime, dataBlocks) |
|
|
|
if pErr != nil { |
|
|
|
if pErr != nil { |
|
|
|
return result, toObjectErr(pErr, bucket, object) |
|
|
|
return result, toObjectErr(pErr, bucket, object) |
|
|
|
} |
|
|
|
} |
|
|
@ -534,7 +530,7 @@ func (xl xlObjects) healObjectDir(ctx context.Context, bucket, object string, dr |
|
|
|
|
|
|
|
|
|
|
|
// Populates default heal result item entries with possible values when we are returning prematurely.
|
|
|
|
// Populates default heal result item entries with possible values when we are returning prematurely.
|
|
|
|
// This is to ensure that in any circumstance we are not returning empty arrays with wrong values.
|
|
|
|
// This is to ensure that in any circumstance we are not returning empty arrays with wrong values.
|
|
|
|
func defaultHealResult(storageDisks []StorageAPI, errs []error, bucket, object string) madmin.HealResultItem { |
|
|
|
func defaultHealResult(latestXLMeta xlMetaV1, storageDisks []StorageAPI, errs []error, bucket, object string) madmin.HealResultItem { |
|
|
|
// Initialize heal result object
|
|
|
|
// Initialize heal result object
|
|
|
|
result := madmin.HealResultItem{ |
|
|
|
result := madmin.HealResultItem{ |
|
|
|
Type: madmin.HealItemObject, |
|
|
|
Type: madmin.HealItemObject, |
|
|
@ -546,6 +542,9 @@ func defaultHealResult(storageDisks []StorageAPI, errs []error, bucket, object s |
|
|
|
// unable to reliably find the object size.
|
|
|
|
// unable to reliably find the object size.
|
|
|
|
ObjectSize: -1, |
|
|
|
ObjectSize: -1, |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
if latestXLMeta.IsValid() { |
|
|
|
|
|
|
|
result.ObjectSize = latestXLMeta.Stat.Size |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
for index, disk := range storageDisks { |
|
|
|
for index, disk := range storageDisks { |
|
|
|
if disk == nil { |
|
|
|
if disk == nil { |
|
|
@ -577,9 +576,14 @@ func defaultHealResult(storageDisks []StorageAPI, errs []error, bucket, object s |
|
|
|
}) |
|
|
|
}) |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
// Default to most common configuration for erasure blocks.
|
|
|
|
if !latestXLMeta.IsValid() { |
|
|
|
result.ParityBlocks = len(storageDisks) / 2 |
|
|
|
// Default to most common configuration for erasure blocks.
|
|
|
|
result.DataBlocks = len(storageDisks) / 2 |
|
|
|
result.ParityBlocks = len(storageDisks) / 2 |
|
|
|
|
|
|
|
result.DataBlocks = len(storageDisks) / 2 |
|
|
|
|
|
|
|
} else { |
|
|
|
|
|
|
|
result.ParityBlocks = latestXLMeta.Erasure.ParityBlocks |
|
|
|
|
|
|
|
result.DataBlocks = latestXLMeta.Erasure.DataBlocks |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
return result |
|
|
|
return result |
|
|
|
} |
|
|
|
} |
|
|
@ -587,7 +591,7 @@ func defaultHealResult(storageDisks []StorageAPI, errs []error, bucket, object s |
|
|
|
// Object is considered dangling/corrupted if and only
|
|
|
|
// Object is considered dangling/corrupted if and only
|
|
|
|
// if total disks - a combination of corrupted and missing
|
|
|
|
// if total disks - a combination of corrupted and missing
|
|
|
|
// files is lesser than number of data blocks.
|
|
|
|
// files is lesser than number of data blocks.
|
|
|
|
func (xl xlObjects) isObjectDangling(metaArr []xlMetaV1, errs []error) (validMeta xlMetaV1, ok bool) { |
|
|
|
func isObjectDangling(metaArr []xlMetaV1, errs []error, dataErrs []error) (validMeta xlMetaV1, ok bool) { |
|
|
|
// We can consider an object data not reliable
|
|
|
|
// We can consider an object data not reliable
|
|
|
|
// when xl.json is not found in read quorum disks.
|
|
|
|
// when xl.json is not found in read quorum disks.
|
|
|
|
// or when xl.json is not readable in read quorum disks.
|
|
|
|
// or when xl.json is not readable in read quorum disks.
|
|
|
@ -599,6 +603,18 @@ func (xl xlObjects) isObjectDangling(metaArr []xlMetaV1, errs []error) (validMet |
|
|
|
corruptedXLJSON++ |
|
|
|
corruptedXLJSON++ |
|
|
|
} |
|
|
|
} |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
var notFoundParts int |
|
|
|
|
|
|
|
for i := range dataErrs { |
|
|
|
|
|
|
|
// Only count part errors, if the error is not
|
|
|
|
|
|
|
|
// same as xl.json error. This is to avoid
|
|
|
|
|
|
|
|
// double counting when both parts and xl.json
|
|
|
|
|
|
|
|
// are not available.
|
|
|
|
|
|
|
|
if errs[i] != dataErrs[i] { |
|
|
|
|
|
|
|
if dataErrs[i] == errFileNotFound { |
|
|
|
|
|
|
|
notFoundParts++ |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
for _, m := range metaArr { |
|
|
|
for _, m := range metaArr { |
|
|
|
if !m.IsValid() { |
|
|
|
if !m.IsValid() { |
|
|
@ -613,15 +629,11 @@ func (xl xlObjects) isObjectDangling(metaArr []xlMetaV1, errs []error) (validMet |
|
|
|
return validMeta, true |
|
|
|
return validMeta, true |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
// We have valid meta, now verify if we have enough files with data blocks.
|
|
|
|
// We have valid meta, now verify if we have enough files with parity blocks.
|
|
|
|
return validMeta, (len(xl.getDisks()) - corruptedXLJSON - notFoundXLJSON) < validMeta.Erasure.DataBlocks |
|
|
|
return validMeta, corruptedXLJSON+notFoundXLJSON+notFoundParts > validMeta.Erasure.ParityBlocks |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
// HealObject - heal the given object.
|
|
|
|
// HealObject - heal the given object, automatically deletes the object if it is stale/corrupted and `remove` is true.
|
|
|
|
//
|
|
|
|
|
|
|
|
// FIXME: If an object was deleted and one disk was down,
|
|
|
|
|
|
|
|
// and later the disk comes back up again, heal on the object
|
|
|
|
|
|
|
|
// should delete it.
|
|
|
|
|
|
|
|
func (xl xlObjects) HealObject(ctx context.Context, bucket, object string, dryRun bool, remove bool, scanMode madmin.HealScanMode) (hr madmin.HealResultItem, err error) { |
|
|
|
func (xl xlObjects) HealObject(ctx context.Context, bucket, object string, dryRun bool, remove bool, scanMode madmin.HealScanMode) (hr madmin.HealResultItem, err error) { |
|
|
|
// Create context that also contains information about the object and bucket.
|
|
|
|
// Create context that also contains information about the object and bucket.
|
|
|
|
// The top level handler might not have this information.
|
|
|
|
// The top level handler might not have this information.
|
|
|
@ -641,13 +653,12 @@ func (xl xlObjects) HealObject(ctx context.Context, bucket, object string, dryRu |
|
|
|
|
|
|
|
|
|
|
|
storageDisks := xl.getDisks() |
|
|
|
storageDisks := xl.getDisks() |
|
|
|
|
|
|
|
|
|
|
|
// FIXME: Metadata is read again in the healObject() call below.
|
|
|
|
|
|
|
|
// Read metadata files from all the disks
|
|
|
|
// Read metadata files from all the disks
|
|
|
|
partsMetadata, errs := readAllXLMetadata(healCtx, storageDisks, bucket, object) |
|
|
|
partsMetadata, errs := readAllXLMetadata(healCtx, storageDisks, bucket, object) |
|
|
|
|
|
|
|
|
|
|
|
// Check if the object is dangling, if yes and user requested
|
|
|
|
// Check if the object is dangling, if yes and user requested
|
|
|
|
// remove we simply delete it from namespace.
|
|
|
|
// remove we simply delete it from namespace.
|
|
|
|
if m, ok := xl.isObjectDangling(partsMetadata, errs); ok { |
|
|
|
if m, ok := isObjectDangling(partsMetadata, errs, []error{}); ok { |
|
|
|
writeQuorum := m.Erasure.DataBlocks + 1 |
|
|
|
writeQuorum := m.Erasure.DataBlocks + 1 |
|
|
|
if m.Erasure.DataBlocks == 0 { |
|
|
|
if m.Erasure.DataBlocks == 0 { |
|
|
|
writeQuorum = len(xl.getDisks())/2 + 1 |
|
|
|
writeQuorum = len(xl.getDisks())/2 + 1 |
|
|
@ -655,21 +666,46 @@ func (xl xlObjects) HealObject(ctx context.Context, bucket, object string, dryRu |
|
|
|
if !dryRun && remove { |
|
|
|
if !dryRun && remove { |
|
|
|
err = xl.deleteObject(healCtx, bucket, object, writeQuorum, false) |
|
|
|
err = xl.deleteObject(healCtx, bucket, object, writeQuorum, false) |
|
|
|
} |
|
|
|
} |
|
|
|
return defaultHealResult(storageDisks, errs, bucket, object), err |
|
|
|
return defaultHealResult(xlMetaV1{}, storageDisks, errs, bucket, object), err |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
latestXLMeta, err := getLatestXLMeta(healCtx, partsMetadata, errs) |
|
|
|
latestXLMeta, err := getLatestXLMeta(healCtx, partsMetadata, errs) |
|
|
|
if err != nil { |
|
|
|
if err != nil { |
|
|
|
return defaultHealResult(storageDisks, errs, bucket, object), toObjectErr(err, bucket, object) |
|
|
|
return defaultHealResult(xlMetaV1{}, storageDisks, errs, bucket, object), toObjectErr(err, bucket, object) |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
// Lock the object before healing.
|
|
|
|
// Lock the object before healing.
|
|
|
|
objectLock := xl.nsMutex.NewNSLock(bucket, object) |
|
|
|
objectLock := xl.nsMutex.NewNSLock(bucket, object) |
|
|
|
if lerr := objectLock.GetRLock(globalHealingTimeout); lerr != nil { |
|
|
|
if lerr := objectLock.GetRLock(globalHealingTimeout); lerr != nil { |
|
|
|
return defaultHealResult(storageDisks, errs, bucket, object), lerr |
|
|
|
return defaultHealResult(latestXLMeta, storageDisks, errs, bucket, object), lerr |
|
|
|
} |
|
|
|
} |
|
|
|
defer objectLock.RUnlock() |
|
|
|
defer objectLock.RUnlock() |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
errCount := 0 |
|
|
|
|
|
|
|
for _, err := range errs { |
|
|
|
|
|
|
|
if err != nil { |
|
|
|
|
|
|
|
errCount++ |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if errCount == len(errs) { |
|
|
|
|
|
|
|
// Only if we get errors from all the disks we return error. Else we need to
|
|
|
|
|
|
|
|
// continue to return filled madmin.HealResultItem struct which includes info
|
|
|
|
|
|
|
|
// on what disks the file is available etc.
|
|
|
|
|
|
|
|
if reducedErr := reduceReadQuorumErrs(ctx, errs, nil, latestXLMeta.Erasure.DataBlocks); reducedErr != nil { |
|
|
|
|
|
|
|
if m, ok := isObjectDangling(partsMetadata, errs, []error{}); ok { |
|
|
|
|
|
|
|
writeQuorum := m.Erasure.DataBlocks + 1 |
|
|
|
|
|
|
|
if m.Erasure.DataBlocks == 0 { |
|
|
|
|
|
|
|
writeQuorum = len(storageDisks)/2 + 1 |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
if !dryRun && remove { |
|
|
|
|
|
|
|
err = xl.deleteObject(ctx, bucket, object, writeQuorum, false) |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
return defaultHealResult(latestXLMeta, storageDisks, errs, bucket, object), toObjectErr(reducedErr, bucket, object) |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
// Heal the object.
|
|
|
|
// Heal the object.
|
|
|
|
return healObject(healCtx, xl.getDisks(), bucket, object, latestXLMeta.Erasure.DataBlocks, dryRun, scanMode) |
|
|
|
return xl.healObject(healCtx, bucket, object, partsMetadata, errs, latestXLMeta, dryRun, remove, scanMode) |
|
|
|
} |
|
|
|
} |
|
|
|