fsrepo.go 16 KB
Newer Older
1 2 3
package fsrepo

import (
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
4 5
	"errors"
	"fmt"
6
	"io"
7
	"os"
8
	"path"
9
	"strconv"
10
	"strings"
11
	"sync"
12

13
	ds "github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore"
14
	"github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore/flatfs"
15
	levelds "github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore/leveldb"
16
	"github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore/measure"
17
	"github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore/mount"
18 19 20 21 22
	ldbopts "github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/syndtr/goleveldb/leveldb/opt"
	repo "github.com/ipfs/go-ipfs/repo"
	"github.com/ipfs/go-ipfs/repo/common"
	config "github.com/ipfs/go-ipfs/repo/config"
	lockfile "github.com/ipfs/go-ipfs/repo/fsrepo/lock"
23
	mfsr "github.com/ipfs/go-ipfs/repo/fsrepo/migrations"
24 25 26 27 28
	serialize "github.com/ipfs/go-ipfs/repo/fsrepo/serialize"
	dir "github.com/ipfs/go-ipfs/thirdparty/dir"
	u "github.com/ipfs/go-ipfs/util"
	util "github.com/ipfs/go-ipfs/util"
	ds2 "github.com/ipfs/go-ipfs/util/datastore2"
29 30
)

31
// RepoVersion is the repo version number that this program currently
// expects to find on disk.
var RepoVersion = "2"

34 35
// migrationInstructions is the pointer to the migration guide that is
// appended to the version-related error messages declared in this file.
var migrationInstructions = `See https://github.com/ipfs/fs-repo-migrations/blob/master/run.md
Sorry for the inconvenience. In the future, these will run automatically.`
36

37 38 39 40 41 42 43 44 45
// errIncorrectRepoFmt is the format string of the error returned by open when
// the on-disk version differs from RepoVersion. Its two %s verbs receive the
// on-disk version and RepoVersion, in that order.
var errIncorrectRepoFmt = `Repo has incorrect version: %s
Program version is: %s
Please run the ipfs migration tool before continuing.
` + migrationInstructions

// ErrNoVersion is returned by open when reading the repo's version fails with
// a not-exist error. ErrOldRepo is returned by checkInitialized when no repo
// is initialized at the requested path but one is found at its ".go-ipfs"
// counterpart.
var (
	ErrNoVersion = errors.New("no version file found, please run 0-to-1 migration tool.\n" + migrationInstructions)
	ErrOldRepo   = errors.New("ipfs repo found in old '~/.go-ipfs' location, please run migration tool.\n" + migrationInstructions)
)
46

47 48 49 50 51 52 53
// NoRepoError reports that no ipfs repo was found at Path.
type NoRepoError struct {
	Path string
}

// Compile-time check that NoRepoError satisfies the error interface.
var _ error = NoRepoError{}

// Error implements the error interface. The message names the path that was
// checked and tells the user how to create a repo.
func (e NoRepoError) Error() string {
	const format = "no ipfs repo found in %s.\nplease run: ipfs init"
	return fmt.Sprintf(format, e.Path)
}

57
// Names of the entries that live directly inside the repo directory.
const (
	// leveldbDirectory holds the leveldb datastore.
	leveldbDirectory = "datastore"
	// flatfsDirectory holds the flatfs datastore.
	flatfsDirectory = "blocks"
	// apiFile is the file in which the API address is recorded.
	apiFile = "api"
)

63
var (
64 65 66

	// packageLock must be held to while performing any operation that modifies an
	// FSRepo's state field. This includes Init, Open, Close, and Remove.
Tommi Virtanen's avatar
Tommi Virtanen committed
67
	packageLock sync.Mutex
68

69 70 71 72 73 74 75 76 77 78 79 80 81
	// onlyOne keeps track of open FSRepo instances.
	//
	// TODO: once command Context / Repo integration is cleaned up,
	// this can be removed. Right now, this makes ConfigCmd.Run
	// function try to open the repo twice:
	//
	//     $ ipfs daemon &
	//     $ ipfs config foo
	//
	// The reason for the above is that in standalone mode without the
	// daemon, `ipfs config` tries to save work by not building the
	// full IpfsNode, but accessing the Repo directly.
	onlyOne repo.OnlyOne
82 83
)

84 85
// FSRepo represents an IPFS FileSystem Repo. It is safe for use by multiple
// callers.
86
type FSRepo struct {
87 88
	// has Close been called already
	closed bool
Brian Tiger Chow's avatar
Brian Tiger Chow committed
89 90
	// path is the file-system path
	path string
91 92 93
	// lockfile is the file system lock to prevent others from opening
	// the same fsrepo path concurrently
	lockfile io.Closer
94
	config   *config.Config
95
	ds       ds.ThreadSafeDatastore
96 97
}

Tommi Virtanen's avatar
Tommi Virtanen committed
98 99
// Compile-time check that *FSRepo implements repo.Repo.
var _ repo.Repo = (*FSRepo)(nil)

100 101
// Open the FSRepo at path. Returns an error if the repo is not
// initialized.
102 103 104 105 106 107 108 109
func Open(repoPath string) (repo.Repo, error) {
	fn := func() (repo.Repo, error) {
		return open(repoPath)
	}
	return onlyOne.Open(repoPath, fn)
}

func open(repoPath string) (repo.Repo, error) {
110 111 112
	packageLock.Lock()
	defer packageLock.Unlock()

113
	r, err := newFSRepo(repoPath)
114 115 116 117
	if err != nil {
		return nil, err
	}

118 119 120
	// Check if its initialized
	if err := checkInitialized(r.path); err != nil {
		return nil, err
121
	}
Tommi Virtanen's avatar
Tommi Virtanen committed
122

Tommi Virtanen's avatar
Tommi Virtanen committed
123 124 125 126 127 128 129 130 131 132 133 134
	r.lockfile, err = lockfile.Lock(r.path)
	if err != nil {
		return nil, err
	}
	keepLocked := false
	defer func() {
		// unlock on error, leave it locked on success
		if !keepLocked {
			r.lockfile.Close()
		}
	}()

135
	// Check version, and error out if not matching
136
	ver, err := mfsr.RepoPath(r.path).Version()
137 138
	if err != nil {
		if os.IsNotExist(err) {
139
			return nil, ErrNoVersion
140 141 142 143
		}
		return nil, err
	}

144
	if ver != RepoVersion {
145
		return nil, fmt.Errorf(errIncorrectRepoFmt, ver, RepoVersion)
146 147
	}

148 149 150 151 152 153 154 155 156 157 158 159 160
	// check repo path, then check all constituent parts.
	if err := dir.Writable(r.path); err != nil {
		return nil, err
	}

	if err := r.openConfig(); err != nil {
		return nil, err
	}

	if err := r.openDatastore(); err != nil {
		return nil, err
	}

Tommi Virtanen's avatar
Tommi Virtanen committed
161
	keepLocked = true
162
	return r, nil
163 164
}

165 166 167 168 169 170 171 172 173 174 175 176 177
// newFSRepo returns an FSRepo whose path is rpath after cleaning and tilde
// expansion. Nothing is opened or locked yet.
func newFSRepo(rpath string) (*FSRepo, error) {
	cleaned := path.Clean(rpath)
	expanded, err := u.TildeExpansion(cleaned)
	if err != nil {
		return nil, err
	}

	fsr := &FSRepo{path: expanded}
	return fsr, nil
}

func checkInitialized(path string) error {
	if !isInitializedUnsynced(path) {
		alt := strings.Replace(path, ".ipfs", ".go-ipfs", 1)
		if isInitializedUnsynced(alt) {
178
			return ErrOldRepo
179
		}
180
		return NoRepoError{Path: path}
181 182 183 184
	}
	return nil
}

185 186 187
// ConfigAt returns an error if the FSRepo at the given path is not
// initialized. This function allows callers to read the config file even when
// another process is running and holding the lock.
Brian Tiger Chow's avatar
huh  
Brian Tiger Chow committed
188
func ConfigAt(repoPath string) (*config.Config, error) {
189 190 191 192 193

	// packageLock must be held to ensure that the Read is atomic.
	packageLock.Lock()
	defer packageLock.Unlock()

Brian Tiger Chow's avatar
huh  
Brian Tiger Chow committed
194 195 196 197
	configFilename, err := config.Filename(repoPath)
	if err != nil {
		return nil, err
	}
198
	return serialize.Load(configFilename)
Brian Tiger Chow's avatar
huh  
Brian Tiger Chow committed
199 200
}

201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230
// configIsInitialized reports whether the config file of the repo at |path|
// exists. It returns false when the config filename cannot be determined.
func configIsInitialized(path string) bool {
	filename, err := config.Filename(path)
	if err != nil {
		return false
	}
	return util.FileExists(filename)
}

// initConfig writes conf as the config file of the repo at path. It does
// nothing, and returns nil, when a config file already exists there.
func initConfig(path string, conf *config.Config) error {
	if configIsInitialized(path) {
		return nil
	}

	filename, err := config.Filename(path)
	if err != nil {
		return err
	}

	// initialization is the one time when it's okay to write to the config
	// without reading the config from disk and merging any user-provided keys
	// that may exist.
	return serialize.WriteConfigFile(filename, conf)
}

Brian Tiger Chow's avatar
Brian Tiger Chow committed
231
// Init initializes a new FSRepo at the given path with the provided config.
232
// TODO add support for custom datastores.
233
func Init(repoPath string, conf *config.Config) error {
234 235 236 237

	// packageLock must be held to ensure that the repo is not initialized more
	// than once.
	packageLock.Lock()
238
	defer packageLock.Unlock()
239

240
	if isInitializedUnsynced(repoPath) {
241 242
		return nil
	}
243

244
	if err := initConfig(repoPath, conf); err != nil {
245 246 247
		return err
	}

248 249
	// The actual datastore contents are initialized lazily when Opened.
	// During Init, we merely check that the directory is writeable.
250 251
	leveldbPath := path.Join(repoPath, leveldbDirectory)
	if err := dir.Writable(leveldbPath); err != nil {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
252
		return fmt.Errorf("datastore: %s", err)
253
	}
254

255 256 257 258 259
	flatfsPath := path.Join(repoPath, flatfsDirectory)
	if err := dir.Writable(flatfsPath); err != nil {
		return fmt.Errorf("datastore: %s", err)
	}

260 261 262 263
	if err := dir.Writable(path.Join(repoPath, "logs")); err != nil {
		return err
	}

264 265 266 267
	if err := mfsr.RepoPath(repoPath).WriteVersion(RepoVersion); err != nil {
		return err
	}

268 269 270
	return nil
}

271
// Remove recursively removes the FSRepo at |path|. The path is cleaned
// first. Removing a path that does not exist is not an error.
//
// NOTE(review): other comments in this file expect Remove to be coordinated
// through packageLock, but it is not taken here — confirm whether callers
// rely on that before adding it.
func Remove(repoPath string) error {
	return os.RemoveAll(path.Clean(repoPath))
}

277 278
// LockedByOtherProcess returns true if the FSRepo is locked by another
// process. If true, then the repo cannot be opened by this process.
279
func LockedByOtherProcess(repoPath string) (bool, error) {
280
	repoPath = path.Clean(repoPath)
281
	// NB: the lock is only held when repos are Open
282
	return lockfile.Locked(repoPath)
283 284
}

285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327
// APIAddr returns the registered API addr, according to the api file
// in the fsrepo. This is a concurrent operation, meaning that any
// process may read this file. modifying this file, therefore, should
// use "mv" to replace the whole file and avoid interleaved read/writes.
//
// It returns repo.ErrApiNotRunning when the api file does not exist. The
// returned address has surrounding whitespace trimmed.
func APIAddr(repoPath string) (string, error) {
	apiFilePath := path.Join(path.Clean(repoPath), apiFile)

	// if there is no file, assume there is no api addr.
	file, err := os.Open(apiFilePath)
	if os.IsNotExist(err) {
		return "", repo.ErrApiNotRunning
	}
	if err != nil {
		return "", err
	}
	defer file.Close()

	// read up to 2048 bytes. Reading the whole file is a vulnerability, as
	// someone could hose the process by putting a massive file there.
	contents := make([]byte, 2048)
	n, err := file.Read(contents)
	if err != nil && err != io.EOF {
		return "", err
	}

	return strings.TrimSpace(string(contents[:n])), nil
}

// SetAPIAddr writes the API Addr to the /api file.
//
// Other processes may read the api file at any time, so the address is first
// written to a temporary file next to it and then renamed over the api file.
// Readers therefore never observe a partially written address. The temporary
// file is removed again if any step fails.
func (r *FSRepo) SetAPIAddr(addr string) error {
	target := path.Join(r.path, apiFile)
	tmp := target + ".tmp"

	f, err := os.Create(tmp)
	if err != nil {
		return err
	}

	if _, err := f.WriteString(addr); err != nil {
		// best-effort cleanup; the write error is the one worth reporting
		f.Close()
		os.Remove(tmp)
		return err
	}
	// A failed Close can mean the data never reached the file, so it must not
	// be ignored.
	if err := f.Close(); err != nil {
		os.Remove(tmp)
		return err
	}

	if err := os.Rename(tmp, target); err != nil {
		os.Remove(tmp)
		return err
	}
	return nil
}

328 329 330 331 332 333 334 335 336 337 338 339 340 341
// openConfig loads the repo's config file into r.config. It returns an error
// if the config filename cannot be determined or the file cannot be loaded;
// r.config is left untouched in that case.
func (r *FSRepo) openConfig() error {
	filename, err := config.Filename(r.path)
	if err != nil {
		return err
	}

	loaded, err := serialize.Load(filename)
	if err != nil {
		return err
	}

	r.config = loaded
	return nil
}

342 343
// openDatastore returns an error if the config file is not present.
func (r *FSRepo) openDatastore() error {
344
	leveldbPath := path.Join(r.path, leveldbDirectory)
345 346
	var err error
	// save leveldb reference so it can be neatly closed afterward
Jeromy's avatar
Jeromy committed
347
	leveldbDS, err := levelds.NewDatastore(leveldbPath, &levelds.Options{
348 349 350
		Compression: ldbopts.NoCompression,
	})
	if err != nil {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
351
		return errors.New("unable to open leveldb datastore")
352
	}
353 354 355 356 357 358 359 360 361 362 363 364 365 366

	// 4TB of 256kB objects ~=17M objects, splitting that 256-way
	// leads to ~66k objects per dir, splitting 256*256-way leads to
	// only 256.
	//
	// The keys seen by the block store have predictable prefixes,
	// including "/" from datastore.Key and 2 bytes from multihash. To
	// reach a uniform 256-way split, we need approximately 4 bytes of
	// prefix.
	blocksDS, err := flatfs.New(path.Join(r.path, flatfsDirectory), 4)
	if err != nil {
		return errors.New("unable to open flatfs datastore")
	}

367 368 369 370 371 372 373 374 375 376
	// Add our PeerID to metrics paths to keep them unique
	//
	// As some tests just pass a zero-value Config to fsrepo.Init,
	// cope with missing PeerID.
	id := r.config.Identity.PeerID
	if id == "" {
		// the tests pass in a zero Config; cope with it
		id = fmt.Sprintf("uninitialized_%p", r)
	}
	prefix := "fsrepo." + id + ".datastore."
Jeromy's avatar
Jeromy committed
377 378
	metricsBlocks := measure.New(prefix+"blocks", blocksDS)
	metricsLevelDB := measure.New(prefix+"leveldb", leveldbDS)
379
	mountDS := mount.New([]mount.Mount{
380 381
		{
			Prefix:    ds.NewKey("/blocks"),
Jeromy's avatar
Jeromy committed
382
			Datastore: metricsBlocks,
383 384 385
		},
		{
			Prefix:    ds.NewKey("/"),
Jeromy's avatar
Jeromy committed
386
			Datastore: metricsLevelDB,
387
		},
388 389 390 391 392 393 394
	})
	// Make sure it's ok to claim the virtual datastore from mount as
	// threadsafe. There's no clean way to make mount itself provide
	// this information without copy-pasting the code into two
	// variants. This is the same dilemma as the `[].byte` attempt at
	// introducing const types to Go.
	var _ ds.ThreadSafeDatastore = blocksDS
Jeromy's avatar
Jeromy committed
395
	var _ ds.ThreadSafeDatastore = leveldbDS
396
	r.ds = ds2.ClaimThreadSafe{mountDS}
397 398 399
	return nil
}

400 401 402 403 404
// Close closes the FSRepo, releasing held resources.
func (r *FSRepo) Close() error {
	packageLock.Lock()
	defer packageLock.Unlock()

405
	if r.closed {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
406
		return errors.New("repo is closed")
407
	}
408

Jeromy's avatar
Jeromy committed
409
	if err := r.ds.(io.Closer).Close(); err != nil {
410
		return err
411
	}
412 413 414 415 416 417 418

	// This code existed in the previous versions, but
	// EventlogComponent.Close was never called. Preserving here
	// pending further discussion.
	//
	// TODO It isn't part of the current contract, but callers may like for us
	// to disable logging once the component is closed.
Jeromy's avatar
Jeromy committed
419
	// logging.Configure(logging.Output(os.Stderr))
420

421 422 423 424 425
	r.closed = true
	if err := r.lockfile.Close(); err != nil {
		return err
	}
	return nil
426 427
}

428
// Result when not Open is undefined. The method may panic if it pleases.
429
func (r *FSRepo) Config() (*config.Config, error) {
430 431 432 433 434 435 436 437 438

	// It is not necessary to hold the package lock since the repo is in an
	// opened state. The package lock is _not_ meant to ensure that the repo is
	// thread-safe. The package lock is only meant to guard againt removal and
	// coordinate the lockfile. However, we provide thread-safety to keep
	// things simple.
	packageLock.Lock()
	defer packageLock.Unlock()

439
	if r.closed {
440
		return nil, errors.New("cannot access config, repo not open")
441
	}
442
	return r.config, nil
443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469
}

// setConfigUnsynced is for private use.
func (r *FSRepo) setConfigUnsynced(updated *config.Config) error {
	configFilename, err := config.Filename(r.path)
	if err != nil {
		return err
	}
	// to avoid clobbering user-provided keys, must read the config from disk
	// as a map, write the updated struct values to the map and write the map
	// to disk.
	var mapconf map[string]interface{}
	if err := serialize.ReadConfigFile(configFilename, &mapconf); err != nil {
		return err
	}
	m, err := config.ToMap(updated)
	if err != nil {
		return err
	}
	for k, v := range m {
		mapconf[k] = v
	}
	if err := serialize.WriteConfigFile(configFilename, mapconf); err != nil {
		return err
	}
	*r.config = *updated // copy so caller cannot modify this private config
	return nil
470 471
}

Brian Tiger Chow's avatar
Brian Tiger Chow committed
472
// SetConfig updates the FSRepo's config.
473
func (r *FSRepo) SetConfig(updated *config.Config) error {
474 475 476 477 478

	// packageLock is held to provide thread-safety.
	packageLock.Lock()
	defer packageLock.Unlock()

479
	return r.setConfigUnsynced(updated)
480 481
}

Brian Tiger Chow's avatar
Brian Tiger Chow committed
482
// GetConfigKey retrieves only the value of a particular key.
483
func (r *FSRepo) GetConfigKey(key string) (interface{}, error) {
484 485 486
	packageLock.Lock()
	defer packageLock.Unlock()

487
	if r.closed {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
488
		return nil, errors.New("repo is closed")
489
	}
490 491 492 493 494 495 496 497 498 499

	filename, err := config.Filename(r.path)
	if err != nil {
		return nil, err
	}
	var cfg map[string]interface{}
	if err := serialize.ReadConfigFile(filename, &cfg); err != nil {
		return nil, err
	}
	return common.MapGetKV(cfg, key)
500 501
}

Brian Tiger Chow's avatar
Brian Tiger Chow committed
502
// SetConfigKey writes the value of a particular key.
503
func (r *FSRepo) SetConfigKey(key string, value interface{}) error {
504 505 506
	packageLock.Lock()
	defer packageLock.Unlock()

507
	if r.closed {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
508
		return errors.New("repo is closed")
509
	}
510 511 512 513 514 515 516 517 518

	filename, err := config.Filename(r.path)
	if err != nil {
		return err
	}
	var mapconf map[string]interface{}
	if err := serialize.ReadConfigFile(filename, &mapconf); err != nil {
		return err
	}
519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556

	// Get the type of the value associated with the key
	oldValue, err := common.MapGetKV(mapconf, key)
	ok := true
	if err != nil {
		// key-value does not exist yet
		switch v := value.(type) {
		case string:
			value, err = strconv.ParseBool(v)
			if err != nil {
				value, err = strconv.Atoi(v)
				if err != nil {
					value, err = strconv.ParseFloat(v, 32)
					if err != nil {
						value = v
					}
				}
			}
		default:
		}
	} else {
		switch oldValue.(type) {
		case bool:
			value, ok = value.(bool)
		case int:
			value, ok = value.(int)
		case float32:
			value, ok = value.(float32)
		case string:
			value, ok = value.(string)
		default:
			value = value
		}
		if !ok {
			return fmt.Errorf("Wrong config type, expected %T", oldValue)
		}
	}

557 558 559
	if err := common.MapSetKV(mapconf, key, value); err != nil {
		return err
	}
560 561 562

	// This step doubles as to validate the map against the struct
	// before serialization
563 564 565 566 567 568 569 570
	conf, err := config.FromMap(mapconf)
	if err != nil {
		return err
	}
	if err := serialize.WriteConfigFile(filename, mapconf); err != nil {
		return err
	}
	return r.setConfigUnsynced(conf) // TODO roll this into this method
571 572
}

573 574 575 576
// Datastore returns a repo-owned datastore. If FSRepo is Closed, return value
// is undefined.
func (r *FSRepo) Datastore() ds.ThreadSafeDatastore {
	packageLock.Lock()
577
	d := r.ds
578 579 580 581
	packageLock.Unlock()
	return d
}

582
var _ io.Closer = &FSRepo{}
583
var _ repo.Repo = &FSRepo{}
584

585 586
// IsInitialized returns true if the repo is initialized at provided |path|.
func IsInitialized(path string) bool {
587 588
	// packageLock is held to ensure that another caller doesn't attempt to
	// Init or Remove the repo while this call is in progress.
589 590
	packageLock.Lock()
	defer packageLock.Unlock()
591

592
	return isInitializedUnsynced(path)
593 594
}

595 596
// private methods below this point. NB: packageLock must be held by caller.

597
// isInitializedUnsynced reports whether the repo is initialized. Caller must
598
// hold the packageLock.
599 600
func isInitializedUnsynced(repoPath string) bool {
	if !configIsInitialized(repoPath) {
601 602
		return false
	}
603
	if !util.FileExists(path.Join(repoPath, leveldbDirectory)) {
604
		return false
605 606
	}
	return true
607
}