Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
N
neoppod
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Analytics
Analytics
CI / CD
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Levin Zimmermann
neoppod
Commits
cd68d92f
Commit
cd68d92f
authored
Aug 01, 2017
by
Kirill Smelkov
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
.
parent
72ee34f1
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
30 additions
and
16 deletions
+30
-16
go/neo/server/master.go
go/neo/server/master.go
+22
-11
go/neo/server/storage.go
go/neo/server/storage.go
+8
-5
No files found.
go/neo/server/master.go
View file @
cd68d92f
...
...
@@ -55,7 +55,7 @@ type Master struct {
// channels controlling main driver
ctlStart
chan
chan
error
// request to start cluster
ctlStop
chan
chan
error
// request to stop cluster
ctlStop
chan
chan
struct
{}
// request to stop cluster
ctlShutdown
chan
chan
error
// request to shutdown cluster XXX with ctx ?
// channels from workers directly serving peers to main driver
...
...
@@ -92,7 +92,7 @@ func NewMaster(clusterName, serveAddr string, net xnet.Networker) *Master {
masterAddr
:
serveAddr
,
// XXX ok?
ctlStart
:
make
(
chan
chan
error
),
ctlStop
:
make
(
chan
chan
error
),
ctlStop
:
make
(
chan
chan
struct
{}
),
ctlShutdown
:
make
(
chan
chan
error
),
nodeCome
:
make
(
chan
nodeCome
),
...
...
@@ -116,8 +116,8 @@ func (m *Master) Run(ctx context.Context) error {
m
.
masterAddr
=
l
.
Addr
()
.
String
()
// serve incoming connections
wg
:=
sync
.
WaitGroup
{}
serveCtx
,
serveCancel
:=
context
.
WithCancel
(
ctx
)
wg
.
Add
(
1
)
go
func
()
{
...
...
@@ -126,7 +126,9 @@ func (m *Master) Run(ctx context.Context) error {
_
=
err
// XXX what to do with err ?
}()
// main driving logic
err
=
m
.
runMain
(
ctx
)
serveCancel
()
wg
.
Wait
()
...
...
@@ -147,9 +149,8 @@ func (m *Master) Start() error {
}
// Stop requests cluster to eventually transition into recovery state
// XXX should be always possible ?
func
(
m
*
Master
)
Stop
()
error
{
ech
:=
make
(
chan
error
)
func
(
m
*
Master
)
Stop
()
{
ech
:=
make
(
chan
struct
{})
m
.
ctlStop
<-
ech
return
<-
ech
}
...
...
@@ -177,20 +178,27 @@ func (m *Master) runMain(ctx context.Context) (err error) {
// NOTE Run's goroutine is the only mutator of nodeTab, partTab and other cluster state
for
ctx
.
Err
()
==
nil
{
// recover partition table from storages and wait till enough
// storages connects us so that we can see the partition table
// can be operational.
//
// Successful recovery means all ^^^ preconditions are met and
// a command came to us to start the cluster.
err
:=
m
.
recovery
(
ctx
)
if
err
!=
nil
{
fmt
.
Println
(
err
)
return
err
// recovery cancelled
}
// successful recovery -> verify
// make sure transactions on storages are properly finished, in
// case previously it was unclean shutdown.
err
=
m
.
verify
(
ctx
)
if
err
!=
nil
{
fmt
.
Println
(
err
)
continue
// -> recovery
}
//
successful verify -> service
//
provide service as long as partition table stays operational
err
=
m
.
service
(
ctx
)
if
err
!=
nil
{
fmt
.
Println
(
err
)
...
...
@@ -301,7 +309,7 @@ loop:
ech
<-
fmt
.
Errorf
(
"start: cluster is non-operational"
)
case
ech
:=
<-
m
.
ctlStop
:
ech
<-
nil
//
we are already recovering
close
(
ech
)
// ok;
we are already recovering
case
<-
ctx
.
Done
()
:
err
=
ctx
.
Err
()
...
...
@@ -491,7 +499,7 @@ loop:
ech
<-
nil
// we are already starting
case
ech
:=
<-
m
.
ctlStop
:
ech
<-
nil
// ok
close
(
ech
)
// ok
err
=
errStopRequested
break
loop
...
...
@@ -577,6 +585,8 @@ func (m *Master) service(ctx context.Context) (err error) {
// XXX we also need to tell storages StartOperation first
m
.
setClusterState
(
neo
.
ClusterRunning
)
// XXX spawn per-storage driver about nodetab
loop
:
for
{
select
{
...
...
@@ -604,8 +614,9 @@ loop:
ech
<-
nil
// we are already started
case
ech
:=
<-
m
.
ctlStop
:
ech
<-
nil
// ok
close
(
ech
)
// ok
err
=
fmt
.
Errorf
(
"stop requested"
)
// XXX tell storages to stop
break
loop
case
<-
ctx
.
Done
()
:
...
...
go/neo/server/storage.go
View file @
cd68d92f
...
...
@@ -34,9 +34,7 @@ import (
"lab.nexedi.com/kirr/go123/xerr"
)
// XXX fmt -> log
// Storage is NEO storage server application
// Storage is NEO node that keeps data and provides read/write access to it
type
Storage
struct
{
neo
.
NodeCommon
...
...
@@ -60,6 +58,7 @@ type Storage struct {
// Use Run to actually start running the node.
func
NewStorage
(
cluster
,
masterAddr
,
serveAddr
string
,
net
xnet
.
Networker
,
zstor
zodb
.
IStorage
)
*
Storage
{
// convert serveAddr into neo format
// XXX -> new.NewNode() ?
addr
,
err
:=
neo
.
AddrString
(
net
.
Network
(),
serveAddr
)
if
err
!=
nil
{
panic
(
err
)
// XXX
...
...
@@ -86,7 +85,7 @@ func NewStorage(cluster, masterAddr, serveAddr string, net xnet.Networker, zstor
// commands it to shutdown.
func
(
stor
*
Storage
)
Run
(
ctx
context
.
Context
)
error
{
// start listening
l
,
err
:=
stor
.
Listen
()
l
,
err
:=
stor
.
node
.
Listen
()
if
err
!=
nil
{
return
err
// XXX err ctx
}
...
...
@@ -112,7 +111,7 @@ func (stor *Storage) Run(ctx context.Context) error {
return
err
// XXX err ctx
}
// --- c
hannel with master directing
us ---
// --- c
onnect to master and let it direct
us ---
// talkMaster connects to master, announces self and receives commands and notifications.
// it tries to persist master link reconnecting as needed
...
...
@@ -293,6 +292,10 @@ func (stor *Storage) m1initialize(ctx context.Context, Mconn *neo.Conn) (err err
// m1serve drives storage by master messages during service phase
//
// Service is regular phase serving requests from clients to load/save object,
// handling transaction commit (with master) and syncing data with other
// storage nodes (XXX correct?).
//
// it always returns with an error describing why serve has to be stopped -
// either due to master commanding us to stop, or context cancel or some other
// error.
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment