2020-04-05 14:20:50 +08:00
|
|
|
// Copyright 2020 The Gitea Authors. All rights reserved.
|
2022-11-28 02:20:29 +08:00
|
|
|
// SPDX-License-Identifier: MIT
|
2020-04-05 14:20:50 +08:00
|
|
|
|
2016-12-26 09:16:37 +08:00
|
|
|
package lfs
|
|
|
|
|
|
|
|
import (
|
|
|
|
"encoding/hex"
|
|
|
|
"errors"
|
2021-03-07 04:21:56 +08:00
|
|
|
"hash"
|
2016-12-26 09:16:37 +08:00
|
|
|
"io"
|
|
|
|
"os"
|
2017-11-08 21:04:19 +08:00
|
|
|
|
2020-03-10 03:56:18 +08:00
|
|
|
"code.gitea.io/gitea/modules/log"
|
2020-09-08 23:45:10 +08:00
|
|
|
"code.gitea.io/gitea/modules/storage"
|
2023-02-23 03:21:46 +08:00
|
|
|
|
|
|
|
"github.com/minio/sha256-simd"
|
2016-12-26 09:16:37 +08:00
|
|
|
)
|
|
|
|
|
|
|
|
var (
|
2021-04-09 06:25:57 +08:00
|
|
|
// ErrHashMismatch occurs if the content has does not match OID
|
2023-05-09 15:34:36 +08:00
|
|
|
ErrHashMismatch = errors.New("content hash does not match OID")
|
2021-04-09 06:25:57 +08:00
|
|
|
// ErrSizeMismatch occurs if the content size does not match
|
2023-05-09 15:34:36 +08:00
|
|
|
ErrSizeMismatch = errors.New("content size does not match")
|
2016-12-26 09:16:37 +08:00
|
|
|
)
|
|
|
|
|
|
|
|
// ContentStore provides a simple file system based storage.
|
|
|
|
type ContentStore struct {
|
2020-09-08 23:45:10 +08:00
|
|
|
storage.ObjectStorage
|
2016-12-26 09:16:37 +08:00
|
|
|
}
|
|
|
|
|
2021-04-09 06:25:57 +08:00
|
|
|
// NewContentStore creates the default ContentStore
|
|
|
|
func NewContentStore() *ContentStore {
|
|
|
|
contentStore := &ContentStore{ObjectStorage: storage.LFS}
|
|
|
|
return contentStore
|
|
|
|
}
|
|
|
|
|
2017-03-15 08:52:01 +08:00
|
|
|
// Get takes a Meta object and retrieves the content from the store, returning
|
2021-04-06 21:22:34 +08:00
|
|
|
// it as an io.ReadSeekCloser.
|
2021-04-09 06:25:57 +08:00
|
|
|
func (s *ContentStore) Get(pointer Pointer) (storage.Object, error) {
|
|
|
|
f, err := s.Open(pointer.RelativePath())
|
2016-12-26 09:16:37 +08:00
|
|
|
if err != nil {
|
2021-04-09 06:25:57 +08:00
|
|
|
log.Error("Whilst trying to read LFS OID[%s]: Unable to open Error: %v", pointer.Oid, err)
|
2016-12-26 09:16:37 +08:00
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return f, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// Put takes a Meta object and an io.Reader and writes the content to the store.
|
2021-04-09 06:25:57 +08:00
|
|
|
func (s *ContentStore) Put(pointer Pointer, r io.Reader) error {
|
|
|
|
p := pointer.RelativePath()
|
2021-03-07 04:21:56 +08:00
|
|
|
|
|
|
|
// Wrap the provided reader with an inline hashing and size checker
|
2021-04-09 06:25:57 +08:00
|
|
|
wrappedRd := newHashingReader(pointer.Size, pointer.Oid, r)
|
2021-03-07 04:21:56 +08:00
|
|
|
|
|
|
|
// now pass the wrapped reader to Save - if there is a size mismatch or hash mismatch then
|
|
|
|
// the errors returned by the newHashingReader should percolate up to here
|
2021-04-09 06:25:57 +08:00
|
|
|
written, err := s.Save(p, wrappedRd, pointer.Size)
|
2016-12-26 09:16:37 +08:00
|
|
|
if err != nil {
|
2021-04-09 06:25:57 +08:00
|
|
|
log.Error("Whilst putting LFS OID[%s]: Failed to copy to tmpPath: %s Error: %v", pointer.Oid, p, err)
|
2016-12-26 09:16:37 +08:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-03-28 23:10:24 +08:00
|
|
|
// check again whether there is any error during the Save operation
|
|
|
|
// because some errors might be ignored by the Reader's caller
|
|
|
|
if wrappedRd.lastError != nil && !errors.Is(wrappedRd.lastError, io.EOF) {
|
|
|
|
err = wrappedRd.lastError
|
|
|
|
} else if written != pointer.Size {
|
|
|
|
err = ErrSizeMismatch
|
|
|
|
}
|
|
|
|
|
|
|
|
// if the upload failed, try to delete the file
|
|
|
|
if err != nil {
|
|
|
|
if errDel := s.Delete(p); errDel != nil {
|
|
|
|
log.Error("Cleaning the LFS OID[%s] failed: %v", pointer.Oid, errDel)
|
2020-09-08 23:45:10 +08:00
|
|
|
}
|
2016-12-26 09:16:37 +08:00
|
|
|
}
|
|
|
|
|
2023-03-28 23:10:24 +08:00
|
|
|
return err
|
2016-12-26 09:16:37 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Exists returns true if the object exists in the content store.
|
2021-04-09 06:25:57 +08:00
|
|
|
func (s *ContentStore) Exists(pointer Pointer) (bool, error) {
|
|
|
|
_, err := s.ObjectStorage.Stat(pointer.RelativePath())
|
2020-09-08 23:45:10 +08:00
|
|
|
if err != nil {
|
|
|
|
if os.IsNotExist(err) {
|
|
|
|
return false, nil
|
|
|
|
}
|
|
|
|
return false, err
|
2016-12-26 09:16:37 +08:00
|
|
|
}
|
2020-09-08 23:45:10 +08:00
|
|
|
return true, nil
|
2016-12-26 09:16:37 +08:00
|
|
|
}
|
|
|
|
|
2017-11-08 21:04:19 +08:00
|
|
|
// Verify returns true if the object exists in the content store and size is correct.
|
2021-04-09 06:25:57 +08:00
|
|
|
func (s *ContentStore) Verify(pointer Pointer) (bool, error) {
|
|
|
|
p := pointer.RelativePath()
|
2020-09-08 23:45:10 +08:00
|
|
|
fi, err := s.ObjectStorage.Stat(p)
|
2021-04-09 06:25:57 +08:00
|
|
|
if os.IsNotExist(err) || (err == nil && fi.Size() != pointer.Size) {
|
2017-11-08 21:04:19 +08:00
|
|
|
return false, nil
|
|
|
|
} else if err != nil {
|
2021-04-09 06:25:57 +08:00
|
|
|
log.Error("Unable stat file: %s for LFS OID[%s] Error: %v", p, pointer.Oid, err)
|
2017-11-08 21:04:19 +08:00
|
|
|
return false, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return true, nil
|
|
|
|
}
|
2021-03-07 04:21:56 +08:00
|
|
|
|
2022-06-12 23:51:54 +08:00
|
|
|
// ReadMetaObject will read a git_model.LFSMetaObject and return a reader
|
2023-05-09 15:34:36 +08:00
|
|
|
func ReadMetaObject(pointer Pointer) (io.ReadSeekCloser, error) {
|
2021-04-09 06:25:57 +08:00
|
|
|
contentStore := NewContentStore()
|
|
|
|
return contentStore.Get(pointer)
|
|
|
|
}
|
|
|
|
|
2021-03-07 04:21:56 +08:00
|
|
|
type hashingReader struct {
|
|
|
|
internal io.Reader
|
|
|
|
currentSize int64
|
|
|
|
expectedSize int64
|
|
|
|
hash hash.Hash
|
|
|
|
expectedHash string
|
2023-03-28 23:10:24 +08:00
|
|
|
lastError error
|
|
|
|
}
|
|
|
|
|
|
|
|
// recordError records the last error during the Save operation
|
|
|
|
// Some callers of the Reader doesn't respect the returned "err"
|
|
|
|
// For example, MinIO's Put will ignore errors if the written size could equal to expected size
|
|
|
|
// So we must remember the error by ourselves,
|
|
|
|
// and later check again whether ErrSizeMismatch or ErrHashMismatch occurs during the Save operation
|
|
|
|
func (r *hashingReader) recordError(err error) error {
|
|
|
|
r.lastError = err
|
|
|
|
return err
|
2021-03-07 04:21:56 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
func (r *hashingReader) Read(b []byte) (int, error) {
|
|
|
|
n, err := r.internal.Read(b)
|
|
|
|
|
|
|
|
if n > 0 {
|
|
|
|
r.currentSize += int64(n)
|
|
|
|
wn, werr := r.hash.Write(b[:n])
|
|
|
|
if wn != n || werr != nil {
|
2023-03-28 23:10:24 +08:00
|
|
|
return n, r.recordError(werr)
|
2021-03-07 04:21:56 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-03-28 23:10:24 +08:00
|
|
|
if errors.Is(err, io.EOF) || r.currentSize >= r.expectedSize {
|
2021-03-07 04:21:56 +08:00
|
|
|
if r.currentSize != r.expectedSize {
|
2023-03-28 23:10:24 +08:00
|
|
|
return n, r.recordError(ErrSizeMismatch)
|
2021-03-07 04:21:56 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
shaStr := hex.EncodeToString(r.hash.Sum(nil))
|
|
|
|
if shaStr != r.expectedHash {
|
2023-03-28 23:10:24 +08:00
|
|
|
return n, r.recordError(ErrHashMismatch)
|
2021-03-07 04:21:56 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-03-28 23:10:24 +08:00
|
|
|
return n, r.recordError(err)
|
2021-03-07 04:21:56 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
func newHashingReader(expectedSize int64, expectedHash string, reader io.Reader) *hashingReader {
|
|
|
|
return &hashingReader{
|
|
|
|
internal: reader,
|
|
|
|
expectedSize: expectedSize,
|
|
|
|
expectedHash: expectedHash,
|
|
|
|
hash: sha256.New(),
|
|
|
|
}
|
|
|
|
}
|