Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
N
neoppod
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Analytics
Analytics
CI / CD
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Jérome Perrin
neoppod
Commits
ca75709f
Commit
ca75709f
authored
Nov 07, 2017
by
Julien Muchembled
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
storage: disable data deduplication by default
parent
03b5b47e
Changes
11
Hide whitespace changes
Inline
Side-by-side
Showing
11 changed files
with
41 additions
and
33 deletions
+41
-33
neo/lib/config.py
neo/lib/config.py
+3
-0
neo/scripts/neostorage.py
neo/scripts/neostorage.py
+3
-0
neo/storage/app.py
neo/storage/app.py
+1
-1
neo/storage/database/importer.py
neo/storage/database/importer.py
+2
-2
neo/storage/database/manager.py
neo/storage/database/manager.py
+3
-3
neo/storage/database/mysqldb.py
neo/storage/database/mysqldb.py
+4
-4
neo/storage/database/sqlite.py
neo/storage/database/sqlite.py
+5
-4
neo/tests/storage/testStorageMySQL.py
neo/tests/storage/testStorageMySQL.py
+1
-1
neo/tests/storage/testStorageSQLite.py
neo/tests/storage/testStorageSQLite.py
+1
-1
neo/tests/threaded/__init__.py
neo/tests/threaded/__init__.py
+2
-2
neo/tests/threaded/test.py
neo/tests/threaded/test.py
+16
-15
No files found.
neo/lib/config.py
View file @
ca75709f
...
...
@@ -147,3 +147,6 @@ class ConfigurationManager(object):
n
=
self
.
__get
(
'autostart'
,
True
)
if
n
:
return
int
(
n
)
def
getDedup
(
self
):
return
self
.
__get
(
'dedup'
,
True
)
neo/scripts/neostorage.py
View file @
ca75709f
...
...
@@ -30,6 +30,9 @@ parser.add_option('-d', '--database', help = 'database connections string')
parser
.
add_option
(
'-e'
,
'--engine'
,
help
=
'database engine'
)
parser
.
add_option
(
'-w'
,
'--wait'
,
help
=
'seconds to wait for backend to be '
'available, before erroring-out (-1 = infinite)'
,
type
=
'float'
,
default
=
0
)
parser
.
add_option
(
'--dedup'
,
action
=
'store_true'
,
help
=
'enable deduplication of data'
' when setting up a new storage node'
)
parser
.
add_option
(
'--disable-drop-partitions'
,
action
=
'store_true'
,
help
=
'do not delete data of discarded cells, which is'
' useful for big databases because the current'
...
...
neo/storage/app.py
View file @
ca75709f
...
...
@@ -69,7 +69,7 @@ class Application(BaseApplication):
# operation related data
self
.
operational
=
False
self
.
dm
.
setup
(
reset
=
config
.
getReset
())
self
.
dm
.
setup
(
reset
=
config
.
getReset
()
,
dedup
=
config
.
getDedup
()
)
self
.
loadConfiguration
()
# force node uuid from command line argument, for testing purpose only
...
...
neo/storage/database/importer.py
View file @
ca75709f
...
...
@@ -322,8 +322,8 @@ class ImporterDatabaseManager(DatabaseManager):
for
zodb
in
self
.
zodb
:
zodb
.
close
()
def
setup
(
self
,
reset
=
0
):
self
.
db
.
setup
(
reset
)
def
setup
(
self
,
reset
=
False
,
dedup
=
False
):
self
.
db
.
setup
(
reset
,
dedup
)
zodb_state
=
self
.
getConfiguration
(
"zodb"
)
if
zodb_state
:
logging
.
warning
(
"Ignoring configuration file for oid mapping."
...
...
neo/storage/database/manager.py
View file @
ca75709f
...
...
@@ -131,7 +131,7 @@ class DatabaseManager(object):
def
erase
(
self
):
""""""
def
_setup
(
self
):
def
_setup
(
self
,
dedup
=
False
):
"""To be overridden by the backend to set up a database
It must recover self._uncommitted_data from temporary object table.
...
...
@@ -142,14 +142,14 @@ class DatabaseManager(object):
"""
@
requires
(
_setup
)
def
setup
(
self
,
reset
=
0
):
def
setup
(
self
,
reset
=
False
,
dedup
=
False
):
"""Set up a database, discarding existing data first if reset is True
"""
if
reset
:
self
.
erase
()
self
.
_readable_set
=
set
()
self
.
_uncommitted_data
=
defaultdict
(
int
)
self
.
_setup
()
self
.
_setup
(
dedup
)
@
abstract
def
nonempty
(
self
,
table
):
...
...
neo/storage/database/mysqldb.py
View file @
ca75709f
...
...
@@ -172,7 +172,7 @@ class MySQLDatabaseManager(DatabaseManager):
if
e
.
args
[
0
]
!=
NO_SUCH_TABLE
:
raise
def
_setup
(
self
):
def
_setup
(
self
,
dedup
=
False
):
self
.
_config
.
clear
()
q
=
self
.
query
p
=
engine
=
self
.
_engine
...
...
@@ -240,9 +240,9 @@ class MySQLDatabaseManager(DatabaseManager):
id BIGINT UNSIGNED NOT NULL AUTO_INCREMENT PRIMARY KEY,
hash BINARY(20) NOT NULL,
compression TINYINT UNSIGNED NULL,
value MEDIUMBLOB NOT NULL
,
UNIQUE (hash, compression)
) ENGINE="""
+
engine
)
value MEDIUMBLOB NOT NULL
%s
) ENGINE=%s"""
%
(
""",
UNIQUE (hash, compression)"""
if
dedup
else
""
,
engine
)
)
q
(
"""CREATE TABLE IF NOT EXISTS bigdata (
id INT UNSIGNED NOT NULL AUTO_INCREMENT PRIMARY KEY,
...
...
neo/storage/database/sqlite.py
View file @
ca75709f
...
...
@@ -112,7 +112,7 @@ class SQLiteDatabaseManager(DatabaseManager):
if
not
e
.
args
[
0
].
startswith
(
"no such table:"
):
raise
def
_setup
(
self
):
def
_setup
(
self
,
dedup
=
False
):
# SQLite does support transactional Data Definition Language statements
# but unfortunately, the built-in Python binding automatically commits
# between such statements. This anti-feature causes this method to be
...
...
@@ -179,9 +179,10 @@ class SQLiteDatabaseManager(DatabaseManager):
compression INTEGER NOT NULL,
value BLOB NOT NULL)
"""
)
q
(
"""CREATE UNIQUE INDEX IF NOT EXISTS _data_i1 ON
data(hash, compression)
"""
)
if
dedup
:
q
(
"""CREATE UNIQUE INDEX IF NOT EXISTS _data_i1 ON
data(hash, compression)
"""
)
# The table "ttrans" stores information on uncommitted transactions.
q
(
"""CREATE TABLE IF NOT EXISTS ttrans (
...
...
neo/tests/storage/testStorageMySQL.py
View file @
ca75709f
...
...
@@ -39,7 +39,7 @@ class StorageMySQLdbTests(StorageDBTests):
self
.
assertEqual
(
db
.
db
,
DB_PREFIX
+
'0'
)
self
.
assertEqual
(
db
.
user
,
DB_USER
)
try
:
db
.
setup
(
reset
)
db
.
setup
(
reset
,
True
)
except
NotSupportedError
as
m
:
code
,
m
=
m
.
args
if
code
!=
UNKNOWN_STORAGE_ENGINE
:
...
...
neo/tests/storage/testStorageSQLite.py
View file @
ca75709f
...
...
@@ -27,7 +27,7 @@ class StorageSQLiteTests(StorageDBTests):
def
getDB
(
self
,
reset
=
0
):
db
=
SQLiteDatabaseManager
(
':memory:'
)
db
.
setup
(
reset
)
db
.
setup
(
reset
,
True
)
return
db
def
test_lockDatabase
(
self
):
...
...
neo/tests/threaded/__init__.py
View file @
ca75709f
...
...
@@ -652,7 +652,7 @@ class NEOCluster(object):
adapter
=
os
.
getenv
(
'NEO_TESTS_ADAPTER'
,
'SQLite'
),
storage_count
=
None
,
db_list
=
None
,
clear_databases
=
True
,
db_user
=
DB_USER
,
db_password
=
''
,
compress
=
True
,
importer
=
None
,
autostart
=
None
):
importer
=
None
,
autostart
=
None
,
dedup
=
False
):
self
.
name
=
'neo_%s'
%
self
.
_allocate
(
'name'
,
lambda
:
random
.
randint
(
0
,
100
))
self
.
compress
=
compress
...
...
@@ -661,7 +661,7 @@ class NEOCluster(object):
for
_
in
xrange
(
master_count
)]
self
.
master_nodes
=
' '
.
join
(
'%s:%s'
%
x
for
x
in
master_list
)
kw
=
Node
.
convertInitArgs
(
replicas
=
replicas
,
adapter
=
adapter
,
partitions
=
partitions
,
reset
=
clear_databases
)
partitions
=
partitions
,
reset
=
clear_databases
,
dedup
=
dedup
)
kw
[
'cluster'
]
=
weak_self
=
weakref
.
proxy
(
self
)
kw
[
'getSSL'
]
=
self
.
SSL
if
upstream
is
not
None
:
...
...
neo/tests/threaded/test.py
View file @
ca75709f
...
...
@@ -37,8 +37,8 @@ from neo.lib import logging
from
neo.lib.protocol
import
(
CellStates
,
ClusterStates
,
NodeStates
,
NodeTypes
,
Packets
,
Packet
,
uuid_str
,
ZERO_OID
,
ZERO_TID
,
MAX_TID
)
from
..
import
expectedFailure
,
unpickle_state
,
Patch
,
TransactionalResource
from
.
import
ClientApplication
,
ConnectionFilter
,
LockLock
,
NEO
ThreadedTest
,
\
RandomConflictDict
,
ThreadId
,
with_cluster
from
.
import
ClientApplication
,
ConnectionFilter
,
LockLock
,
NEO
Cluster
,
\
NEOThreadedTest
,
RandomConflictDict
,
ThreadId
,
with_cluster
from
neo.lib.util
import
add64
,
makeChecksum
,
p64
,
u64
from
neo.client.exception
import
NEOPrimaryMasterLost
,
NEOStorageError
from
neo.client.transactions
import
Transaction
...
...
@@ -198,9 +198,9 @@ class Test(NEOThreadedTest):
def
testUndoConflictDuringStore
(
self
,
cluster
):
self
.
_testUndoConflict
(
cluster
,
1
)
@
with_cluster
()
def
testStorageDataLock
(
self
,
cluster
)
:
if
1
:
def
testStorageDataLock
(
self
,
dedup
=
False
):
with
NEOCluster
(
dedup
=
dedup
)
as
cluster
:
cluster
.
start
()
storage
=
cluster
.
getZODBStorage
()
data_info
=
{}
...
...
@@ -212,8 +212,6 @@ class Test(NEOThreadedTest):
r1
=
storage
.
store
(
oid
,
None
,
data
,
''
,
txn
)
r2
=
storage
.
tpc_vote
(
txn
)
tid
=
storage
.
tpc_finish
(
txn
)
data_info
[
key
]
=
0
storage
.
sync
()
txn
=
[
transaction
.
Transaction
()
for
x
in
xrange
(
4
)]
for
t
in
txn
:
...
...
@@ -221,20 +219,20 @@ class Test(NEOThreadedTest):
storage
.
store
(
oid
if
tid
else
storage
.
new_oid
(),
tid
,
data
,
''
,
t
)
tid
=
None
data_info
[
key
]
=
4
s
torage
.
syn
c
()
data_info
[
key
]
=
4
if
dedup
else
1
s
elf
.
ti
c
()
self
.
assertEqual
(
data_info
,
cluster
.
storage
.
getDataLockInfo
())
storage
.
tpc_abort
(
txn
.
pop
())
for
t
in
txn
:
storage
.
tpc_vote
(
t
)
s
torage
.
syn
c
()
data_info
[
key
]
-=
1
s
elf
.
ti
c
()
data_info
[
key
]
-=
dedup
self
.
assertEqual
(
data_info
,
cluster
.
storage
.
getDataLockInfo
())
storage
.
tpc_abort
(
txn
[
1
])
s
torage
.
syn
c
()
data_info
[
key
]
-=
1
s
elf
.
ti
c
()
data_info
[
key
]
-=
dedup
self
.
assertEqual
(
data_info
,
cluster
.
storage
.
getDataLockInfo
())
tid1
=
storage
.
tpc_finish
(
txn
[
2
])
...
...
@@ -243,10 +241,13 @@ class Test(NEOThreadedTest):
self
.
assertEqual
(
data_info
,
cluster
.
storage
.
getDataLockInfo
())
storage
.
tpc_abort
(
txn
[
0
])
s
torage
.
syn
c
()
data_info
[
key
]
-=
1
s
elf
.
ti
c
()
data_info
[
key
]
-=
dedup
self
.
assertEqual
(
data_info
,
cluster
.
storage
.
getDataLockInfo
())
def
testStorageDataLockWithDeduplication
(
self
,
dedup
=
False
):
self
.
testStorageDataLock
(
True
)
@
with_cluster
()
def
testStorageDataLock2
(
self
,
cluster
):
storage
=
cluster
.
getZODBStorage
()
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment