fsrepo.go 16.7 KB
Newer Older
1 2 3
package fsrepo

import (
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
4 5
	"errors"
	"fmt"
6
	"io"
7
	"os"
8
	"path"
9
	"strconv"
10
	"strings"
11
	"sync"
12

13
	ds "github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore"
14
	"github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore/flatfs"
15
	levelds "github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore/leveldb"
16
	"github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore/measure"
17
	"github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/jbenet/go-datastore/mount"
18 19 20 21 22
	ldbopts "github.com/ipfs/go-ipfs/Godeps/_workspace/src/github.com/syndtr/goleveldb/leveldb/opt"
	repo "github.com/ipfs/go-ipfs/repo"
	"github.com/ipfs/go-ipfs/repo/common"
	config "github.com/ipfs/go-ipfs/repo/config"
	lockfile "github.com/ipfs/go-ipfs/repo/fsrepo/lock"
23
	mfsr "github.com/ipfs/go-ipfs/repo/fsrepo/migrations"
24 25 26 27 28 29
	serialize "github.com/ipfs/go-ipfs/repo/fsrepo/serialize"
	dir "github.com/ipfs/go-ipfs/thirdparty/dir"
	"github.com/ipfs/go-ipfs/thirdparty/eventlog"
	u "github.com/ipfs/go-ipfs/util"
	util "github.com/ipfs/go-ipfs/util"
	ds2 "github.com/ipfs/go-ipfs/util/datastore2"
30 31
)

32
// RepoVersion is the repo version this program expects to find on disk.
var RepoVersion = "2"

// User-facing text explaining how to migrate a repo.
var (
	migrationInstructions = `See https://github.com/ipfs/fs-repo-migrations/blob/master/run.md
Sorry for the inconvenience. In the future, these will run automatically.`

	// errIncorrectRepoFmt is a format string; its two verbs take the version
	// found in the repo followed by the version this program expects.
	errIncorrectRepoFmt = `Repo has incorrect version: %s
Program version is: %s
Please run the ipfs migration tool before continuing.
` + migrationInstructions
)

// Errors reported when a repo cannot be used without a migration.
var (
	// ErrNoVersion means the repo has no version file.
	ErrNoVersion = errors.New("no version file found, please run 0-to-1 migration tool.\n" + migrationInstructions)
	// ErrOldRepo means a repo was found in the old '~/.go-ipfs' location.
	ErrOldRepo = errors.New("ipfs repo found in old '~/.go-ipfs' location, please run migration tool.\n" + migrationInstructions)
)
47

48 49 50 51 52 53 54
// NoRepoError reports that no ipfs repo was found at Path.
type NoRepoError struct {
	// Path is the location that was checked.
	Path string
}

// Compile-time check that NoRepoError satisfies the error interface.
var _ error = NoRepoError{}

// Error returns a message naming the path and suggesting `ipfs init`.
func (e NoRepoError) Error() string {
	const format = "no ipfs repo found in %s.\nplease run: ipfs init"
	return fmt.Sprintf(format, e.Path)
}

58
// Names of the entries kept directly inside the repo directory.
const (
	// leveldbDirectory is where the leveldb datastore lives.
	leveldbDirectory = "datastore"
	// flatfsDirectory is where the flatfs block store lives.
	flatfsDirectory = "blocks"
	// apiFile is the file holding the registered API address.
	apiFile = "api"
)

64
var (
65 66 67

	// packageLock must be held to while performing any operation that modifies an
	// FSRepo's state field. This includes Init, Open, Close, and Remove.
Tommi Virtanen's avatar
Tommi Virtanen committed
68
	packageLock sync.Mutex
69

70 71 72 73 74 75 76 77 78 79 80 81 82
	// onlyOne keeps track of open FSRepo instances.
	//
	// TODO: once command Context / Repo integration is cleaned up,
	// this can be removed. Right now, this makes ConfigCmd.Run
	// function try to open the repo twice:
	//
	//     $ ipfs daemon &
	//     $ ipfs config foo
	//
	// The reason for the above is that in standalone mode without the
	// daemon, `ipfs config` tries to save work by not building the
	// full IpfsNode, but accessing the Repo directly.
	onlyOne repo.OnlyOne
83 84
)

85 86
// FSRepo represents an IPFS FileSystem Repo. It is safe for use by multiple
// callers.
87
type FSRepo struct {
88 89
	// has Close been called already
	closed bool
Brian Tiger Chow's avatar
Brian Tiger Chow committed
90 91
	// path is the file-system path
	path string
92 93 94
	// lockfile is the file system lock to prevent others from opening
	// the same fsrepo path concurrently
	lockfile io.Closer
95
	config   *config.Config
96 97
	ds       ds.ThreadSafeDatastore
	// tracked separately for use in Close; do not use directly.
98 99 100
	leveldbDS      levelds.Datastore
	metricsBlocks  measure.DatastoreCloser
	metricsLevelDB measure.DatastoreCloser
101 102
}

Tommi Virtanen's avatar
Tommi Virtanen committed
103 104
var _ repo.Repo = (*FSRepo)(nil)

105 106
// Open the FSRepo at path. Returns an error if the repo is not
// initialized.
107 108 109 110 111 112 113 114
func Open(repoPath string) (repo.Repo, error) {
	fn := func() (repo.Repo, error) {
		return open(repoPath)
	}
	return onlyOne.Open(repoPath, fn)
}

func open(repoPath string) (repo.Repo, error) {
115 116 117
	packageLock.Lock()
	defer packageLock.Unlock()

118
	r, err := newFSRepo(repoPath)
119 120 121 122
	if err != nil {
		return nil, err
	}

123 124 125
	// Check if its initialized
	if err := checkInitialized(r.path); err != nil {
		return nil, err
126
	}
Tommi Virtanen's avatar
Tommi Virtanen committed
127

Tommi Virtanen's avatar
Tommi Virtanen committed
128 129 130 131 132 133 134 135 136 137 138 139
	r.lockfile, err = lockfile.Lock(r.path)
	if err != nil {
		return nil, err
	}
	keepLocked := false
	defer func() {
		// unlock on error, leave it locked on success
		if !keepLocked {
			r.lockfile.Close()
		}
	}()

140
	// Check version, and error out if not matching
141
	ver, err := mfsr.RepoPath(r.path).Version()
142 143
	if err != nil {
		if os.IsNotExist(err) {
144
			return nil, ErrNoVersion
145 146 147 148
		}
		return nil, err
	}

149
	if ver != RepoVersion {
150
		return nil, fmt.Errorf(errIncorrectRepoFmt, ver, RepoVersion)
151 152
	}

153 154 155 156 157 158 159 160 161 162 163 164 165
	// check repo path, then check all constituent parts.
	if err := dir.Writable(r.path); err != nil {
		return nil, err
	}

	if err := r.openConfig(); err != nil {
		return nil, err
	}

	if err := r.openDatastore(); err != nil {
		return nil, err
	}

166
	// setup eventlogger
167 168
	configureEventLoggerAtRepoPath(r.config, r.path)

Tommi Virtanen's avatar
Tommi Virtanen committed
169
	keepLocked = true
170
	return r, nil
171 172
}

173 174 175 176 177 178 179 180 181 182 183 184 185
// newFSRepo returns an FSRepo whose path is rpath after cleaning and tilde
// expansion. No other field is set and nothing is opened.
func newFSRepo(rpath string) (*FSRepo, error) {
	cleaned := path.Clean(rpath)
	expanded, err := u.TildeExpansion(cleaned)
	if err != nil {
		return nil, err
	}
	r := &FSRepo{path: expanded}
	return r, nil
}

func checkInitialized(path string) error {
	if !isInitializedUnsynced(path) {
		alt := strings.Replace(path, ".ipfs", ".go-ipfs", 1)
		if isInitializedUnsynced(alt) {
186
			return ErrOldRepo
187
		}
188
		return NoRepoError{Path: path}
189 190 191 192
	}
	return nil
}

193 194 195
// ConfigAt returns an error if the FSRepo at the given path is not
// initialized. This function allows callers to read the config file even when
// another process is running and holding the lock.
Brian Tiger Chow's avatar
huh  
Brian Tiger Chow committed
196
func ConfigAt(repoPath string) (*config.Config, error) {
197 198 199 200 201

	// packageLock must be held to ensure that the Read is atomic.
	packageLock.Lock()
	defer packageLock.Unlock()

Brian Tiger Chow's avatar
huh  
Brian Tiger Chow committed
202 203 204 205
	configFilename, err := config.Filename(repoPath)
	if err != nil {
		return nil, err
	}
206
	return serialize.Load(configFilename)
Brian Tiger Chow's avatar
huh  
Brian Tiger Chow committed
207 208
}

209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238
// configIsInitialized reports whether the config file for the repo at |path|
// exists. It reports false when the config file name cannot be determined.
func configIsInitialized(path string) bool {
	filename, err := config.Filename(path)
	if err != nil {
		return false
	}
	return util.FileExists(filename)
}

// initConfig writes conf as the config file of the repo at |path|. If a
// config file already exists there it is left alone and nil is returned.
func initConfig(path string, conf *config.Config) error {
	if configIsInitialized(path) {
		return nil
	}
	filename, err := config.Filename(path)
	if err != nil {
		return err
	}
	// Initialization is the one time when it is okay to write the config
	// without first reading it from disk and merging any user-provided keys
	// that may exist.
	return serialize.WriteConfigFile(filename, conf)
}

Brian Tiger Chow's avatar
Brian Tiger Chow committed
239
// Init initializes a new FSRepo at the given path with the provided config.
240
// TODO add support for custom datastores.
241
func Init(repoPath string, conf *config.Config) error {
242 243 244 245

	// packageLock must be held to ensure that the repo is not initialized more
	// than once.
	packageLock.Lock()
246
	defer packageLock.Unlock()
247

248
	if isInitializedUnsynced(repoPath) {
249 250
		return nil
	}
251

252
	if err := initConfig(repoPath, conf); err != nil {
253 254 255
		return err
	}

256 257
	// The actual datastore contents are initialized lazily when Opened.
	// During Init, we merely check that the directory is writeable.
258 259
	leveldbPath := path.Join(repoPath, leveldbDirectory)
	if err := dir.Writable(leveldbPath); err != nil {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
260
		return fmt.Errorf("datastore: %s", err)
261
	}
262

263 264 265 266 267
	flatfsPath := path.Join(repoPath, flatfsDirectory)
	if err := dir.Writable(flatfsPath); err != nil {
		return fmt.Errorf("datastore: %s", err)
	}

268 269 270 271
	if err := dir.Writable(path.Join(repoPath, "logs")); err != nil {
		return err
	}

272 273 274 275
	if err := mfsr.RepoPath(repoPath).WriteVersion(RepoVersion); err != nil {
		return err
	}

276 277 278
	return nil
}

279
// Remove recursively removes the FSRepo at |repoPath|. The path is cleaned
// before removal; the result of os.RemoveAll is returned as is.
func Remove(repoPath string) error {
	return os.RemoveAll(path.Clean(repoPath))
}

285 286
// LockedByOtherProcess returns true if the FSRepo is locked by another
// process. If true, then the repo cannot be opened by this process.
287
func LockedByOtherProcess(repoPath string) (bool, error) {
288
	repoPath = path.Clean(repoPath)
289
	// NB: the lock is only held when repos are Open
290
	return lockfile.Locked(repoPath)
291 292
}

293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335
// APIAddr returns the registered API addr, according to the api file
// in the fsrepo. This is a concurrent operation, meaning that any
// process may read this file. Modifying this file, therefore, should
// use "mv" to replace the whole file and avoid interleaved read/writes.
//
// It returns repo.ErrApiNotRunning when the api file does not exist. The
// returned address has surrounding whitespace trimmed, and at most the first
// 2048 bytes of the file are considered.
func APIAddr(repoPath string) (string, error) {
	repoPath = path.Clean(repoPath)
	apiFilePath := path.Join(repoPath, apiFile)

	// if there is no file, assume there is no api addr.
	f, err := os.Open(apiFilePath)
	if err != nil {
		if os.IsNotExist(err) {
			return "", repo.ErrApiNotRunning
		}
		return "", err
	}
	defer f.Close()

	// Read up to 2048 bytes. Reading the whole file is a vulnerability, as
	// someone could hose the process by putting a massive file there.
	//
	// io.ReadFull keeps reading until the buffer is full or the file ends; a
	// single Read call is allowed to return fewer bytes than are available,
	// which would silently truncate the address.
	buf := make([]byte, 2048)
	n, err := io.ReadFull(f, buf)
	// io.EOF (empty file) and io.ErrUnexpectedEOF (file shorter than the
	// buffer) are the expected outcomes here, not failures.
	if err != nil && err != io.EOF && err != io.ErrUnexpectedEOF {
		return "", err
	}

	return strings.TrimSpace(string(buf[:n])), nil
}

// SetAPIAddr writes the API Addr to the /api file.
//
// Any process may read the api file at any time, so it is never written in
// place: the address goes to a temporary file next to it, which is then
// renamed over the api file. Readers therefore see either the old or the new
// contents, never an empty or partially written file. On failure the
// temporary file is removed and the existing api file is left untouched.
func (r *FSRepo) SetAPIAddr(addr string) error {
	target := path.Join(r.path, apiFile)
	tmp := target + ".tmp"

	f, err := os.Create(tmp)
	if err != nil {
		return err
	}

	_, err = f.WriteString(addr)
	// Always close the file, but report the write error first if both fail.
	if cerr := f.Close(); err == nil {
		err = cerr
	}
	if err == nil {
		err = os.Rename(tmp, target)
	}
	if err != nil {
		// Best-effort cleanup; the original error is the one worth reporting.
		os.Remove(tmp)
		return err
	}
	return nil
}

336 337 338 339 340 341 342 343 344 345 346 347 348 349
// openConfig loads the repo's config file into r.config. It returns an error
// if the config file name cannot be determined or the file cannot be loaded,
// in which case r.config is left unchanged.
func (r *FSRepo) openConfig() error {
	filename, err := config.Filename(r.path)
	if err != nil {
		return err
	}
	loaded, err := serialize.Load(filename)
	if err != nil {
		return err
	}
	r.config = loaded
	return nil
}

350 351
// openDatastore returns an error if the config file is not present.
func (r *FSRepo) openDatastore() error {
352
	leveldbPath := path.Join(r.path, leveldbDirectory)
353 354 355
	var err error
	// save leveldb reference so it can be neatly closed afterward
	r.leveldbDS, err = levelds.NewDatastore(leveldbPath, &levelds.Options{
356 357 358
		Compression: ldbopts.NoCompression,
	})
	if err != nil {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
359
		return errors.New("unable to open leveldb datastore")
360
	}
361 362 363 364 365 366 367 368 369 370 371 372 373 374

	// 4TB of 256kB objects ~=17M objects, splitting that 256-way
	// leads to ~66k objects per dir, splitting 256*256-way leads to
	// only 256.
	//
	// The keys seen by the block store have predictable prefixes,
	// including "/" from datastore.Key and 2 bytes from multihash. To
	// reach a uniform 256-way split, we need approximately 4 bytes of
	// prefix.
	blocksDS, err := flatfs.New(path.Join(r.path, flatfsDirectory), 4)
	if err != nil {
		return errors.New("unable to open flatfs datastore")
	}

375 376 377 378 379 380 381 382 383 384 385 386
	// Add our PeerID to metrics paths to keep them unique
	//
	// As some tests just pass a zero-value Config to fsrepo.Init,
	// cope with missing PeerID.
	id := r.config.Identity.PeerID
	if id == "" {
		// the tests pass in a zero Config; cope with it
		id = fmt.Sprintf("uninitialized_%p", r)
	}
	prefix := "fsrepo." + id + ".datastore."
	r.metricsBlocks = measure.New(prefix+"blocks", blocksDS)
	r.metricsLevelDB = measure.New(prefix+"leveldb", r.leveldbDS)
387
	mountDS := mount.New([]mount.Mount{
388 389 390 391 392 393 394 395
		{
			Prefix:    ds.NewKey("/blocks"),
			Datastore: r.metricsBlocks,
		},
		{
			Prefix:    ds.NewKey("/"),
			Datastore: r.metricsLevelDB,
		},
396 397 398 399 400 401 402 403 404
	})
	// Make sure it's ok to claim the virtual datastore from mount as
	// threadsafe. There's no clean way to make mount itself provide
	// this information without copy-pasting the code into two
	// variants. This is the same dilemma as the `[].byte` attempt at
	// introducing const types to Go.
	var _ ds.ThreadSafeDatastore = blocksDS
	var _ ds.ThreadSafeDatastore = r.leveldbDS
	r.ds = ds2.ClaimThreadSafe{mountDS}
405 406 407
	return nil
}

408 409 410
func configureEventLoggerAtRepoPath(c *config.Config, repoPath string) {
	eventlog.Configure(eventlog.LevelInfo)
	eventlog.Configure(eventlog.LdJSONFormatter)
Jeromy's avatar
Jeromy committed
411
	eventlog.Configure(eventlog.Output(eventlog.WriterGroup))
412 413
}

414 415 416 417 418
// Close closes the FSRepo, releasing held resources.
func (r *FSRepo) Close() error {
	packageLock.Lock()
	defer packageLock.Unlock()

419
	if r.closed {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
420
		return errors.New("repo is closed")
421
	}
422

423 424 425 426 427 428
	if err := r.metricsBlocks.Close(); err != nil {
		return err
	}
	if err := r.metricsLevelDB.Close(); err != nil {
		return err
	}
429
	if err := r.leveldbDS.Close(); err != nil {
430
		return err
431
	}
432 433 434 435 436 437 438 439 440

	// This code existed in the previous versions, but
	// EventlogComponent.Close was never called. Preserving here
	// pending further discussion.
	//
	// TODO It isn't part of the current contract, but callers may like for us
	// to disable logging once the component is closed.
	// eventlog.Configure(eventlog.Output(os.Stderr))

441 442 443 444 445
	r.closed = true
	if err := r.lockfile.Close(); err != nil {
		return err
	}
	return nil
446 447
}

448
// Result when not Open is undefined. The method may panic if it pleases.
449
func (r *FSRepo) Config() (*config.Config, error) {
450 451 452 453 454 455 456 457 458

	// It is not necessary to hold the package lock since the repo is in an
	// opened state. The package lock is _not_ meant to ensure that the repo is
	// thread-safe. The package lock is only meant to guard againt removal and
	// coordinate the lockfile. However, we provide thread-safety to keep
	// things simple.
	packageLock.Lock()
	defer packageLock.Unlock()

459
	if r.closed {
460
		return nil, errors.New("cannot access config, repo not open")
461
	}
462
	return r.config, nil
463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489
}

// setConfigUnsynced is for private use.
func (r *FSRepo) setConfigUnsynced(updated *config.Config) error {
	configFilename, err := config.Filename(r.path)
	if err != nil {
		return err
	}
	// to avoid clobbering user-provided keys, must read the config from disk
	// as a map, write the updated struct values to the map and write the map
	// to disk.
	var mapconf map[string]interface{}
	if err := serialize.ReadConfigFile(configFilename, &mapconf); err != nil {
		return err
	}
	m, err := config.ToMap(updated)
	if err != nil {
		return err
	}
	for k, v := range m {
		mapconf[k] = v
	}
	if err := serialize.WriteConfigFile(configFilename, mapconf); err != nil {
		return err
	}
	*r.config = *updated // copy so caller cannot modify this private config
	return nil
490 491
}

Brian Tiger Chow's avatar
Brian Tiger Chow committed
492
// SetConfig updates the FSRepo's config.
493
func (r *FSRepo) SetConfig(updated *config.Config) error {
494 495 496 497 498

	// packageLock is held to provide thread-safety.
	packageLock.Lock()
	defer packageLock.Unlock()

499
	return r.setConfigUnsynced(updated)
500 501
}

Brian Tiger Chow's avatar
Brian Tiger Chow committed
502
// GetConfigKey retrieves only the value of a particular key.
503
func (r *FSRepo) GetConfigKey(key string) (interface{}, error) {
504 505 506
	packageLock.Lock()
	defer packageLock.Unlock()

507
	if r.closed {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
508
		return nil, errors.New("repo is closed")
509
	}
510 511 512 513 514 515 516 517 518 519

	filename, err := config.Filename(r.path)
	if err != nil {
		return nil, err
	}
	var cfg map[string]interface{}
	if err := serialize.ReadConfigFile(filename, &cfg); err != nil {
		return nil, err
	}
	return common.MapGetKV(cfg, key)
520 521
}

Brian Tiger Chow's avatar
Brian Tiger Chow committed
522
// SetConfigKey writes the value of a particular key.
523
func (r *FSRepo) SetConfigKey(key string, value interface{}) error {
524 525 526
	packageLock.Lock()
	defer packageLock.Unlock()

527
	if r.closed {
Juan Batiz-Benet's avatar
Juan Batiz-Benet committed
528
		return errors.New("repo is closed")
529
	}
530 531 532 533 534 535 536 537 538

	filename, err := config.Filename(r.path)
	if err != nil {
		return err
	}
	var mapconf map[string]interface{}
	if err := serialize.ReadConfigFile(filename, &mapconf); err != nil {
		return err
	}
539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576

	// Get the type of the value associated with the key
	oldValue, err := common.MapGetKV(mapconf, key)
	ok := true
	if err != nil {
		// key-value does not exist yet
		switch v := value.(type) {
		case string:
			value, err = strconv.ParseBool(v)
			if err != nil {
				value, err = strconv.Atoi(v)
				if err != nil {
					value, err = strconv.ParseFloat(v, 32)
					if err != nil {
						value = v
					}
				}
			}
		default:
		}
	} else {
		switch oldValue.(type) {
		case bool:
			value, ok = value.(bool)
		case int:
			value, ok = value.(int)
		case float32:
			value, ok = value.(float32)
		case string:
			value, ok = value.(string)
		default:
			value = value
		}
		if !ok {
			return fmt.Errorf("Wrong config type, expected %T", oldValue)
		}
	}

577 578 579
	if err := common.MapSetKV(mapconf, key, value); err != nil {
		return err
	}
580 581 582

	// This step doubles as to validate the map against the struct
	// before serialization
583 584 585 586 587 588 589 590
	conf, err := config.FromMap(mapconf)
	if err != nil {
		return err
	}
	if err := serialize.WriteConfigFile(filename, mapconf); err != nil {
		return err
	}
	return r.setConfigUnsynced(conf) // TODO roll this into this method
591 592
}

593 594 595 596
// Datastore returns a repo-owned datastore. If FSRepo is Closed, return value
// is undefined.
func (r *FSRepo) Datastore() ds.ThreadSafeDatastore {
	packageLock.Lock()
597
	d := r.ds
598 599 600 601
	packageLock.Unlock()
	return d
}

602
var _ io.Closer = &FSRepo{}
603
var _ repo.Repo = &FSRepo{}
604

605 606
// IsInitialized returns true if the repo is initialized at provided |path|.
func IsInitialized(path string) bool {
607 608
	// packageLock is held to ensure that another caller doesn't attempt to
	// Init or Remove the repo while this call is in progress.
609 610
	packageLock.Lock()
	defer packageLock.Unlock()
611

612
	return isInitializedUnsynced(path)
613 614
}

615 616
// private methods below this point. NB: packageLock must be held by caller.

617
// isInitializedUnsynced reports whether the repo is initialized. Caller must
618
// hold the packageLock.
619 620
func isInitializedUnsynced(repoPath string) bool {
	if !configIsInitialized(repoPath) {
621 622
		return false
	}
623
	if !util.FileExists(path.Join(repoPath, leveldbDirectory)) {
624
		return false
625 626
	}
	return true
627
}