fsrepo.go 16.7 KB
Newer Older
1 2 3
package fsrepo

import (
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
4 5
	"errors"
	"fmt"
6
	"io"
7
	"os"
Jeromy's avatar
Jeromy committed
8
	"path/filepath"
9
	"strconv"
10
	"strings"
11
	"sync"
12

13
	ds "github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore"
14
	"github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore/flatfs"
15
	levelds "github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore/leveldb"
16
	"github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore/measure"
17
	"github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore/mount"
18 19 20 21 22
	ldbopts "github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/syndtr/goleveldb/leveldb/opt"
	repo "github.com/ipfs/go-ipfs/repo"
	"github.com/ipfs/go-ipfs/repo/common"
	config "github.com/ipfs/go-ipfs/repo/config"
	lockfile "github.com/ipfs/go-ipfs/repo/fsrepo/lock"
23
	mfsr "github.com/ipfs/go-ipfs/repo/fsrepo/migrations"
24 25 26 27
	serialize "github.com/ipfs/go-ipfs/repo/fsrepo/serialize"
	dir "github.com/ipfs/go-ipfs/thirdparty/dir"
	util "github.com/ipfs/go-ipfs/util"
	ds2 "github.com/ipfs/go-ipfs/util/datastore2"
Jeromy's avatar
Jeromy committed
28
	logging "github.com/ipfs/go-ipfs/vendor/QmQg1J6vikuXF9oDvm4wpdeAUvvkVEKW1EYDw9HhTMnP2b/go-log"
29 30
)

Jeromy's avatar
Jeromy committed
31 32
// log is the package-level logger, created under the name "fsrepo".
var log = logging.Logger("fsrepo")

33
// RepoVersion is the repo version this build expects to find on disk when
// opening a repo; it is also the version written by Init.
var RepoVersion = "3"
35

36 37
// migrationInstructions points users at the migration guide. It is appended
// to every version-related error message declared below.
var migrationInstructions = "See https://github.com/ipfs/fs-repo-migrations/blob/master/run.md\n" +
	"Sorry for the inconvenience. In the future, these will run automatically."

// errIncorrectRepoFmt is the format string for the version-mismatch error.
// Its two %s verbs take the version found on disk and the version this
// program expects, in that order.
var errIncorrectRepoFmt = "Repo has incorrect version: %s\n" +
	"Program version is: %s\n" +
	"Please run the ipfs migration tool before continuing.\n" +
	migrationInstructions

var (
	// ErrNoVersion is returned by open when the repo has no version file.
	ErrNoVersion = errors.New("no version file found, please run 0-to-1 migration tool.\n" + migrationInstructions)
	// ErrOldRepo is returned when no repo exists at the requested path but
	// one is found at the legacy ".go-ipfs" location.
	ErrOldRepo = errors.New("ipfs repo found in old '~/.go-ipfs' location, please run migration tool.\n" + migrationInstructions)
)
48

49 50 51 52 53 54 55
// NoRepoError reports that no initialized repo was found at Path.
type NoRepoError struct {
	// Path is the location that was checked.
	Path string
}

// Compile-time check that NoRepoError satisfies error.
var _ error = NoRepoError{}

// Error implements the error interface. The message names the path that was
// checked and tells the user how to create a repo.
func (e NoRepoError) Error() string {
	return "no ipfs repo found in " + e.Path + ".\nplease run: ipfs init"
}

59
// Names of the entries this package creates or reads inside the repo
// directory.
const (
	// leveldbDirectory is the subdirectory holding the leveldb datastore.
	leveldbDirectory = "datastore"
	// flatfsDirectory is the subdirectory holding the flatfs block store.
	flatfsDirectory = "blocks"
	// apiFile is the file holding the registered API address.
	apiFile = "api"
)

65
var (
66 67 68

	// packageLock must be held to while performing any operation that modifies an
	// FSRepo's state field. This includes Init, Open, Close, and Remove.
Tommi Virtanen's avatar
Tommi Virtanen committed
69
	packageLock sync.Mutex
70

71 72 73 74 75 76 77 78 79 80 81 82 83
	// onlyOne keeps track of open FSRepo instances.
	//
	// TODO: once command Context / Repo integration is cleaned up,
	// this can be removed. Right now, this makes ConfigCmd.Run
	// function try to open the repo twice:
	//
	//     $ ipfs daemon &
	//     $ ipfs config foo
	//
	// The reason for the above is that in standalone mode without the
	// daemon, `ipfs config` tries to save work by not building the
	// full IpfsNode, but accessing the Repo directly.
	onlyOne repo.OnlyOne
84 85
)

86 87
// FSRepo represents an IPFS FileSystem Repo. It is safe for use by multiple
// callers.
88
type FSRepo struct {
89 90
	// has Close been called already
	closed bool
Brian Tiger Chow's avatar
Brian Tiger Chow committed
91 92
	// path is the file-system path
	path string
93 94 95
	// lockfile is the file system lock to prevent others from opening
	// the same fsrepo path concurrently
	lockfile io.Closer
96
	config   *config.Config
97
	ds       ds.ThreadSafeDatastore
98 99
}

Tommi Virtanen's avatar
Tommi Virtanen committed
100 101
// Compile-time check that *FSRepo implements repo.Repo.
var _ repo.Repo = (*FSRepo)(nil)

102 103
// Open the FSRepo at path. Returns an error if the repo is not
// initialized.
104 105 106 107 108 109 110 111
func Open(repoPath string) (repo.Repo, error) {
	fn := func() (repo.Repo, error) {
		return open(repoPath)
	}
	return onlyOne.Open(repoPath, fn)
}

func open(repoPath string) (repo.Repo, error) {
112 113 114
	packageLock.Lock()
	defer packageLock.Unlock()

115
	r, err := newFSRepo(repoPath)
116 117 118 119
	if err != nil {
		return nil, err
	}

120 121 122
	// Check if its initialized
	if err := checkInitialized(r.path); err != nil {
		return nil, err
123
	}
Tommi Virtanen's avatar
Tommi Virtanen committed
124

Tommi Virtanen's avatar
Tommi Virtanen committed
125 126 127 128 129 130 131 132 133 134 135 136
	r.lockfile, err = lockfile.Lock(r.path)
	if err != nil {
		return nil, err
	}
	keepLocked := false
	defer func() {
		// unlock on error, leave it locked on success
		if !keepLocked {
			r.lockfile.Close()
		}
	}()

137
	// Check version, and error out if not matching
138
	ver, err := mfsr.RepoPath(r.path).Version()
139 140
	if err != nil {
		if os.IsNotExist(err) {
141
			return nil, ErrNoVersion
142 143 144 145
		}
		return nil, err
	}

146
	if ver != RepoVersion {
147
		return nil, fmt.Errorf(errIncorrectRepoFmt, ver, RepoVersion)
148 149
	}

150 151 152 153 154 155 156 157 158 159 160 161 162
	// check repo path, then check all constituent parts.
	if err := dir.Writable(r.path); err != nil {
		return nil, err
	}

	if err := r.openConfig(); err != nil {
		return nil, err
	}

	if err := r.openDatastore(); err != nil {
		return nil, err
	}

Tommi Virtanen's avatar
Tommi Virtanen committed
163
	keepLocked = true
164
	return r, nil
165 166
}

167
func newFSRepo(rpath string) (*FSRepo, error) {
rht's avatar
rht committed
168
	expPath, err := util.TildeExpansion(filepath.Clean(rpath))
169 170 171 172 173 174 175 176 177 178 179
	if err != nil {
		return nil, err
	}

	return &FSRepo{path: expPath}, nil
}

func checkInitialized(path string) error {
	if !isInitializedUnsynced(path) {
		alt := strings.Replace(path, ".ipfs", ".go-ipfs", 1)
		if isInitializedUnsynced(alt) {
180
			return ErrOldRepo
181
		}
182
		return NoRepoError{Path: path}
183 184 185 186
	}
	return nil
}

187 188 189
// ConfigAt returns an error if the FSRepo at the given path is not
// initialized. This function allows callers to read the config file even when
// another process is running and holding the lock.
Brian Tiger Chow's avatar
huh  
Brian Tiger Chow committed
190
func ConfigAt(repoPath string) (*config.Config, error) {
191 192 193 194 195

	// packageLock must be held to ensure that the Read is atomic.
	packageLock.Lock()
	defer packageLock.Unlock()

Brian Tiger Chow's avatar
huh  
Brian Tiger Chow committed
196 197 198 199
	configFilename, err := config.Filename(repoPath)
	if err != nil {
		return nil, err
	}
200
	return serialize.Load(configFilename)
Brian Tiger Chow's avatar
huh  
Brian Tiger Chow committed
201 202
}

203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232
// configIsInitialized reports whether a config file exists for the repo at
// |path|. It reports false when the config filename cannot be determined.
func configIsInitialized(path string) bool {
	filename, err := config.Filename(path)
	return err == nil && util.FileExists(filename)
}

// initConfig writes conf as the config file of the repo at path. If a config
// file already exists there it is left untouched and nil is returned.
func initConfig(path string, conf *config.Config) error {
	if configIsInitialized(path) {
		return nil
	}

	filename, err := config.Filename(path)
	if err != nil {
		return err
	}

	// Initialization is the one time when it is okay to write the config
	// without first reading it from disk and merging in any user-provided
	// keys that may exist.
	return serialize.WriteConfigFile(filename, conf)
}

Brian Tiger Chow's avatar
Brian Tiger Chow committed
233
// Init initializes a new FSRepo at the given path with the provided config.
234
// TODO add support for custom datastores.
235
func Init(repoPath string, conf *config.Config) error {
236 237 238 239

	// packageLock must be held to ensure that the repo is not initialized more
	// than once.
	packageLock.Lock()
240
	defer packageLock.Unlock()
241

242
	if isInitializedUnsynced(repoPath) {
243 244
		return nil
	}
245

246
	if err := initConfig(repoPath, conf); err != nil {
247 248 249
		return err
	}

250 251
	// The actual datastore contents are initialized lazily when Opened.
	// During Init, we merely check that the directory is writeable.
Jeromy's avatar
Jeromy committed
252
	leveldbPath := filepath.Join(repoPath, leveldbDirectory)
253
	if err := dir.Writable(leveldbPath); err != nil {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
254
		return fmt.Errorf("datastore: %s", err)
255
	}
256

Jeromy's avatar
Jeromy committed
257
	flatfsPath := filepath.Join(repoPath, flatfsDirectory)
258 259 260 261
	if err := dir.Writable(flatfsPath); err != nil {
		return fmt.Errorf("datastore: %s", err)
	}

Jeromy's avatar
Jeromy committed
262
	if err := dir.Writable(filepath.Join(repoPath, "logs")); err != nil {
263 264 265
		return err
	}

266 267 268 269
	if err := mfsr.RepoPath(repoPath).WriteVersion(RepoVersion); err != nil {
		return err
	}

270 271 272
	return nil
}

273
// Remove recursively removes the FSRepo at |repoPath|. The path is cleaned
// with filepath.Clean before removal.
func Remove(repoPath string) error {
	return os.RemoveAll(filepath.Clean(repoPath))
}

279 280
// LockedByOtherProcess returns true if the FSRepo is locked by another
// process. If true, then the repo cannot be opened by this process.
281
func LockedByOtherProcess(repoPath string) (bool, error) {
Jeromy's avatar
Jeromy committed
282
	repoPath = filepath.Clean(repoPath)
283
	// NB: the lock is only held when repos are Open
284
	return lockfile.Locked(repoPath)
285 286
}

287 288 289 290 291
// APIAddr returns the registered API addr, according to the api file
// in the fsrepo. This is a concurrent operation, meaning that any
// process may read this file. modifying this file, therefore, should
// use "mv" to replace the whole file and avoid interleaved read/writes.
func APIAddr(repoPath string) (string, error) {
Jeromy's avatar
Jeromy committed
292 293
	repoPath = filepath.Clean(repoPath)
	apiFilePath := filepath.Join(repoPath, apiFile)
294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319

	// if there is no file, assume there is no api addr.
	f, err := os.Open(apiFilePath)
	if err != nil {
		if os.IsNotExist(err) {
			return "", repo.ErrApiNotRunning
		}
		return "", err
	}
	defer f.Close()

	// read up to 2048 bytes. io.ReadAll is a vulnerability, as
	// someone could hose the process by putting a massive file there.
	buf := make([]byte, 2048)
	n, err := f.Read(buf)
	if err != nil && err != io.EOF {
		return "", err
	}

	s := string(buf[:n])
	s = strings.TrimSpace(s)
	return s, nil
}

// SetAPIAddr writes the API Addr to the /api file.
func (r *FSRepo) SetAPIAddr(addr string) error {
Jeromy's avatar
Jeromy committed
320
	f, err := os.Create(filepath.Join(r.path, apiFile))
321 322 323 324 325 326 327 328 329
	if err != nil {
		return err
	}
	defer f.Close()

	_, err = f.WriteString(addr)
	return err
}

330 331 332 333 334 335 336 337 338 339 340 341 342 343
// openConfig loads the repo's config file from disk and stores it in
// r.config. It returns an error if the config filename cannot be determined
// or the file cannot be loaded (for example because it is not present);
// r.config is left unchanged in that case.
func (r *FSRepo) openConfig() error {
	filename, err := config.Filename(r.path)
	if err != nil {
		return err
	}

	loaded, err := serialize.Load(filename)
	if err != nil {
		return err
	}

	r.config = loaded
	return nil
}

344 345
// openDatastore returns an error if the config file is not present.
func (r *FSRepo) openDatastore() error {
Jeromy's avatar
Jeromy committed
346
	leveldbPath := filepath.Join(r.path, leveldbDirectory)
347 348
	var err error
	// save leveldb reference so it can be neatly closed afterward
Jeromy's avatar
Jeromy committed
349
	leveldbDS, err := levelds.NewDatastore(leveldbPath, &levelds.Options{
350 351 352
		Compression: ldbopts.NoCompression,
	})
	if err != nil {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
353
		return errors.New("unable to open leveldb datastore")
354
	}
355 356 357 358 359 360 361 362 363

	// 4TB of 256kB objects ~=17M objects, splitting that 256-way
	// leads to ~66k objects per dir, splitting 256*256-way leads to
	// only 256.
	//
	// The keys seen by the block store have predictable prefixes,
	// including "/" from datastore.Key and 2 bytes from multihash. To
	// reach a uniform 256-way split, we need approximately 4 bytes of
	// prefix.
Jeromy's avatar
Jeromy committed
364
	blocksDS, err := flatfs.New(filepath.Join(r.path, flatfsDirectory), 4)
365 366 367 368
	if err != nil {
		return errors.New("unable to open flatfs datastore")
	}

369 370 371 372 373 374 375 376 377 378
	// Add our PeerID to metrics paths to keep them unique
	//
	// As some tests just pass a zero-value Config to fsrepo.Init,
	// cope with missing PeerID.
	id := r.config.Identity.PeerID
	if id == "" {
		// the tests pass in a zero Config; cope with it
		id = fmt.Sprintf("uninitialized_%p", r)
	}
	prefix := "fsrepo." + id + ".datastore."
Jeromy's avatar
Jeromy committed
379 380
	metricsBlocks := measure.New(prefix+"blocks", blocksDS)
	metricsLevelDB := measure.New(prefix+"leveldb", leveldbDS)
381
	mountDS := mount.New([]mount.Mount{
382 383
		{
			Prefix:    ds.NewKey("/blocks"),
Jeromy's avatar
Jeromy committed
384
			Datastore: metricsBlocks,
385 386 387
		},
		{
			Prefix:    ds.NewKey("/"),
Jeromy's avatar
Jeromy committed
388
			Datastore: metricsLevelDB,
389
		},
390 391 392 393 394 395 396
	})
	// Make sure it's ok to claim the virtual datastore from mount as
	// threadsafe. There's no clean way to make mount itself provide
	// this information without copy-pasting the code into two
	// variants. This is the same dilemma as the `[].byte` attempt at
	// introducing const types to Go.
	var _ ds.ThreadSafeDatastore = blocksDS
Jeromy's avatar
Jeromy committed
397
	var _ ds.ThreadSafeDatastore = leveldbDS
398
	r.ds = ds2.ClaimThreadSafe{mountDS}
399 400 401
	return nil
}

402 403 404 405 406
// Close closes the FSRepo, releasing held resources.
func (r *FSRepo) Close() error {
	packageLock.Lock()
	defer packageLock.Unlock()

407
	if r.closed {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
408
		return errors.New("repo is closed")
409
	}
410

Jeromy's avatar
Jeromy committed
411
	if err := r.ds.(io.Closer).Close(); err != nil {
412
		return err
413
	}
414

Jeromy's avatar
Jeromy committed
415 416 417 418 419
	err := os.Remove(filepath.Join(r.path, apiFile))
	if err != nil {
		log.Warning("error removing api file: ", err)
	}

420 421 422 423 424 425
	// This code existed in the previous versions, but
	// EventlogComponent.Close was never called. Preserving here
	// pending further discussion.
	//
	// TODO It isn't part of the current contract, but callers may like for us
	// to disable logging once the component is closed.
Jeromy's avatar
Jeromy committed
426
	// logging.Configure(logging.Output(os.Stderr))
427

428 429 430 431 432
	r.closed = true
	if err := r.lockfile.Close(); err != nil {
		return err
	}
	return nil
433 434
}

435
// Result when not Open is undefined. The method may panic if it pleases.
436
func (r *FSRepo) Config() (*config.Config, error) {
437 438 439 440 441 442 443 444 445

	// It is not necessary to hold the package lock since the repo is in an
	// opened state. The package lock is _not_ meant to ensure that the repo is
	// thread-safe. The package lock is only meant to guard againt removal and
	// coordinate the lockfile. However, we provide thread-safety to keep
	// things simple.
	packageLock.Lock()
	defer packageLock.Unlock()

446
	if r.closed {
447
		return nil, errors.New("cannot access config, repo not open")
448
	}
449
	return r.config, nil
450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476
}

// setConfigUnsynced is for private use.
func (r *FSRepo) setConfigUnsynced(updated *config.Config) error {
	configFilename, err := config.Filename(r.path)
	if err != nil {
		return err
	}
	// to avoid clobbering user-provided keys, must read the config from disk
	// as a map, write the updated struct values to the map and write the map
	// to disk.
	var mapconf map[string]interface{}
	if err := serialize.ReadConfigFile(configFilename, &mapconf); err != nil {
		return err
	}
	m, err := config.ToMap(updated)
	if err != nil {
		return err
	}
	for k, v := range m {
		mapconf[k] = v
	}
	if err := serialize.WriteConfigFile(configFilename, mapconf); err != nil {
		return err
	}
	*r.config = *updated // copy so caller cannot modify this private config
	return nil
477 478
}

Brian Tiger Chow's avatar
Brian Tiger Chow committed
479
// SetConfig updates the FSRepo's config.
480
func (r *FSRepo) SetConfig(updated *config.Config) error {
481 482 483 484 485

	// packageLock is held to provide thread-safety.
	packageLock.Lock()
	defer packageLock.Unlock()

486
	return r.setConfigUnsynced(updated)
487 488
}

Brian Tiger Chow's avatar
Brian Tiger Chow committed
489
// GetConfigKey retrieves only the value of a particular key.
490
func (r *FSRepo) GetConfigKey(key string) (interface{}, error) {
491 492 493
	packageLock.Lock()
	defer packageLock.Unlock()

494
	if r.closed {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
495
		return nil, errors.New("repo is closed")
496
	}
497 498 499 500 501 502 503 504 505 506

	filename, err := config.Filename(r.path)
	if err != nil {
		return nil, err
	}
	var cfg map[string]interface{}
	if err := serialize.ReadConfigFile(filename, &cfg); err != nil {
		return nil, err
	}
	return common.MapGetKV(cfg, key)
507 508
}

Brian Tiger Chow's avatar
Brian Tiger Chow committed
509
// SetConfigKey writes the value of a particular key.
510
func (r *FSRepo) SetConfigKey(key string, value interface{}) error {
511 512 513
	packageLock.Lock()
	defer packageLock.Unlock()

514
	if r.closed {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
515
		return errors.New("repo is closed")
516
	}
517 518 519 520 521 522 523 524 525

	filename, err := config.Filename(r.path)
	if err != nil {
		return err
	}
	var mapconf map[string]interface{}
	if err := serialize.ReadConfigFile(filename, &mapconf); err != nil {
		return err
	}
526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563

	// Get the type of the value associated with the key
	oldValue, err := common.MapGetKV(mapconf, key)
	ok := true
	if err != nil {
		// key-value does not exist yet
		switch v := value.(type) {
		case string:
			value, err = strconv.ParseBool(v)
			if err != nil {
				value, err = strconv.Atoi(v)
				if err != nil {
					value, err = strconv.ParseFloat(v, 32)
					if err != nil {
						value = v
					}
				}
			}
		default:
		}
	} else {
		switch oldValue.(type) {
		case bool:
			value, ok = value.(bool)
		case int:
			value, ok = value.(int)
		case float32:
			value, ok = value.(float32)
		case string:
			value, ok = value.(string)
		default:
			value = value
		}
		if !ok {
			return fmt.Errorf("Wrong config type, expected %T", oldValue)
		}
	}

564 565 566
	if err := common.MapSetKV(mapconf, key, value); err != nil {
		return err
	}
567 568 569

	// This step doubles as to validate the map against the struct
	// before serialization
570 571 572 573 574 575 576 577
	conf, err := config.FromMap(mapconf)
	if err != nil {
		return err
	}
	if err := serialize.WriteConfigFile(filename, mapconf); err != nil {
		return err
	}
	return r.setConfigUnsynced(conf) // TODO roll this into this method
578 579
}

580 581 582 583
// Datastore returns a repo-owned datastore. If FSRepo is Closed, return value
// is undefined.
func (r *FSRepo) Datastore() ds.ThreadSafeDatastore {
	packageLock.Lock()
584
	d := r.ds
585 586 587 588
	packageLock.Unlock()
	return d
}

rht's avatar
rht committed
589 590 591 592 593 594 595 596 597 598 599 600 601 602 603
// GetStorageUsage computes the storage space taken by the repo in bytes.
//
// It walks the directory returned by config.PathRoot and sums the Size() of
// every entry visited, directories included. Entries that cannot be
// inspected are skipped rather than aborting the walk; if the root itself
// cannot be read, that error is returned.
//
// NOTE(review): the walk starts at config.PathRoot(), not at r.path —
// confirm that is intended for repos opened at a non-default location.
func (r *FSRepo) GetStorageUsage() (uint64, error) {
	pth, err := config.PathRoot()
	if err != nil {
		return 0, err
	}

	var du uint64
	err = filepath.Walk(pth, func(p string, f os.FileInfo, err error) error {
		if err != nil {
			// filepath.Walk reports a failed Lstat with a nil FileInfo, so f
			// must not be dereferenced here. Entries may also disappear
			// mid-walk; skip them instead of failing the whole computation.
			if p == pth {
				return err
			}
			return nil
		}
		du += uint64(f.Size())
		return nil
	})
	return du, err
}

604
var _ io.Closer = &FSRepo{}
605
var _ repo.Repo = &FSRepo{}
606

607 608
// IsInitialized returns true if the repo is initialized at provided |path|.
func IsInitialized(path string) bool {
609 610
	// packageLock is held to ensure that another caller doesn't attempt to
	// Init or Remove the repo while this call is in progress.
611 612
	packageLock.Lock()
	defer packageLock.Unlock()
613

614
	return isInitializedUnsynced(path)
615 616
}

617 618
// private methods below this point. NB: packageLock must be held by caller.

619
// isInitializedUnsynced reports whether the repo is initialized. Caller must
620
// hold the packageLock.
621 622
func isInitializedUnsynced(repoPath string) bool {
	if !configIsInitialized(repoPath) {
623 624
		return false
	}
625

Jeromy's avatar
Jeromy committed
626
	if !util.FileExists(filepath.Join(repoPath, leveldbDirectory)) {
627
		return false
628
	}
629

630
	return true
631
}