Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
M
mariadb
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
Analytics
Analytics
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Commits
Issue Boards
Open sidebar
Kirill Smelkov
mariadb
Commits
72765abf
Commit
72765abf
authored
Sep 26, 2006
by
jonas@perch.ndb.mysql.com
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
ndb - bug#20895
Fix occasional LCP hang!!! Make sure only to consider alive nodes in startNextChkpt
parent
0d360045
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
71 additions
and
60 deletions
+71
-60
ndb/src/kernel/blocks/dbdih/DbdihMain.cpp
ndb/src/kernel/blocks/dbdih/DbdihMain.cpp
+71
-60
No files found.
ndb/src/kernel/blocks/dbdih/DbdihMain.cpp
View file @
72765abf
...
@@ -9561,15 +9561,19 @@ void Dbdih::startNextChkpt(Signal* signal)
...
@@ -9561,15 +9561,19 @@ void Dbdih::startNextChkpt(Signal* signal)
nodePtr
.
i
=
replicaPtr
.
p
->
procNode
;
nodePtr
.
i
=
replicaPtr
.
p
->
procNode
;
ptrCheckGuard
(
nodePtr
,
MAX_NDB_NODES
,
nodeRecord
);
ptrCheckGuard
(
nodePtr
,
MAX_NDB_NODES
,
nodeRecord
);
if
(
c_lcpState
.
m_participatingLQH
.
get
(
nodePtr
.
i
))
{
if
(
replicaPtr
.
p
->
lcpOngoingFlag
&&
if
(
replicaPtr
.
p
->
lcpOngoingFlag
&&
replicaPtr
.
p
->
lcpIdStarted
<
lcpId
)
{
replicaPtr
.
p
->
lcpIdStarted
<
lcpId
)
{
jam
();
jam
();
//-------------------------------------------------------------------
//-------------------------------------------------------------------
// We have found a replica on a node that performs local checkpoint
// We have found a replica on a node that performs local checkpoint
// that is alive and that has not yet been started.
// that is alive and that has not yet been started.
//-------------------------------------------------------------------
//-------------------------------------------------------------------
if
(
nodePtr
.
p
->
noOfStartedChkpt
<
2
)
{
if
(
nodePtr
.
p
->
noOfStartedChkpt
<
2
)
{
jam
();
jam
();
/**
/**
* Send LCP_FRAG_ORD to LQH
* Send LCP_FRAG_ORD to LQH
...
@@ -9587,7 +9591,9 @@ void Dbdih::startNextChkpt(Signal* signal)
...
@@ -9587,7 +9591,9 @@ void Dbdih::startNextChkpt(Signal* signal)
nodePtr
.
p
->
noOfStartedChkpt
=
i
+
1
;
nodePtr
.
p
->
noOfStartedChkpt
=
i
+
1
;
sendLCP_FRAG_ORD
(
signal
,
nodePtr
.
p
->
startedChkpt
[
i
]);
sendLCP_FRAG_ORD
(
signal
,
nodePtr
.
p
->
startedChkpt
[
i
]);
}
else
if
(
nodePtr
.
p
->
noOfQueuedChkpt
<
2
)
{
}
else
if
(
nodePtr
.
p
->
noOfQueuedChkpt
<
2
)
{
jam
();
jam
();
/**
/**
* Put LCP_FRAG_ORD "in queue"
* Put LCP_FRAG_ORD "in queue"
...
@@ -9603,10 +9609,13 @@ void Dbdih::startNextChkpt(Signal* signal)
...
@@ -9603,10 +9609,13 @@ void Dbdih::startNextChkpt(Signal* signal)
nodePtr
.
p
->
queuedChkpt
[
i
].
fragId
=
curr
.
fragmentId
;
nodePtr
.
p
->
queuedChkpt
[
i
].
fragId
=
curr
.
fragmentId
;
nodePtr
.
p
->
queuedChkpt
[
i
].
replicaPtr
=
replicaPtr
.
i
;
nodePtr
.
p
->
queuedChkpt
[
i
].
replicaPtr
=
replicaPtr
.
i
;
nodePtr
.
p
->
noOfQueuedChkpt
=
i
+
1
;
nodePtr
.
p
->
noOfQueuedChkpt
=
i
+
1
;
}
else
{
}
else
{
jam
();
jam
();
if
(
save
){
if
(
save
)
{
/**
/**
* Stop increasing value on first that was "full"
* Stop increasing value on first that was "full"
*/
*/
...
@@ -9615,7 +9624,8 @@ void Dbdih::startNextChkpt(Signal* signal)
...
@@ -9615,7 +9624,8 @@ void Dbdih::startNextChkpt(Signal* signal)
}
}
busyNodes
.
set
(
nodePtr
.
i
);
busyNodes
.
set
(
nodePtr
.
i
);
if
(
busyNodes
.
count
()
==
lcpNodes
){
if
(
busyNodes
.
count
()
==
lcpNodes
)
{
/**
/**
* There was no possibility to start the local checkpoint
* There was no possibility to start the local checkpoint
* and it was not possible to queue it up. In this case we
* and it was not possible to queue it up. In this case we
...
@@ -9628,6 +9638,7 @@ void Dbdih::startNextChkpt(Signal* signal)
...
@@ -9628,6 +9638,7 @@ void Dbdih::startNextChkpt(Signal* signal)
}
//if
}
//if
}
}
}
//while
}
//while
}
curr
.
fragmentId
++
;
curr
.
fragmentId
++
;
if
(
curr
.
fragmentId
>=
tabPtr
.
p
->
totalfragments
)
{
if
(
curr
.
fragmentId
>=
tabPtr
.
p
->
totalfragments
)
{
jam
();
jam
();
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment