一共有4台机器,各自挂接一个存储,希望实现:
尽量节约存储
高可用性
存储大量数据
配置方案:
每一台机器做一个分片的主数据库
每一台机器做一个分片的后备数据库
每一台机器做一个分片的仲裁服务
两个两个一组交叉作对方的后备
有三台机器开配置服务
有一台机器开路由服务(生产环境可以在每一台Windows App服务器上开路由服务,App服务器集群做负载均衡)
这样的话,任何一台服务器完全离线(或者交叉的两台服务器离线),都能保证整个系统正常运行。不过在离线的服务器重新起来之后需要:
在升级成为主数据库的那个后备数据库上运行rs.stepDown(100)来让它让出主数据库的位置,因为每一个分片的活动数据库都应该由独立服务器担当,以获得最好的性能
配置服务和后备数据库起来之后不需要做任何调整
192.168.129.142
mkdir -p /usr/data/shard1
mkdir -p /usr/data/shard2
mkdir -p /usr/data/shard3
mkdir -p /usr/data/config1
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --shardsvr
--port 10001 --dbpath /usr/data/shard1/ --logpath
/usr/data/shard1/log.log --replSet shard1 --rest
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --shardsvr
--port 10002 --dbpath /usr/data/shard2/ --logpath
/usr/data/shard2/log.log --replSet shard2 --rest
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --shardsvr
--port 10003 --dbpath /usr/data/shard3/ --logpath
/usr/data/shard3/log.log --replSet shard3 --rest
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --configsvr
--port 20001 --dbpath /usr/data/config1/ --logpath
/usr/data/config1/log.log --rest
ps aux | grep mongodb | grep -v grep
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongo --port 10001
config = {_id: 'shard1', members: [
{_id: 0, host:
'192.168.129.142:10001'},
{_id: 1, host:
'192.168.129.172:10001'},
{_id: 2, host:
'192.168.129.173:10001', arbiterOnly: true}
]}
rs.initiate(config)
rs.status()
192.168.129.172
mkdir -p /usr/data/shard2
mkdir -p /usr/data/shard1
mkdir -p /usr/data/shard4
mkdir -p /usr/data/config2
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --shardsvr
--port 10002 --dbpath /usr/data/shard2/ --logpath
/usr/data/shard2/log.log --replSet shard2 --rest
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --shardsvr
--port 10001 --dbpath /usr/data/shard1/ --logpath
/usr/data/shard1/log.log --replSet shard1 --rest
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --shardsvr
--port 10004 --dbpath /usr/data/shard4/ --logpath
/usr/data/shard4/log.log --replSet shard4 --rest
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --configsvr
--port 20002 --dbpath /usr/data/config2/ --logpath
/usr/data/config2/log.log --rest
ps aux | grep mongodb | grep -v grep
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongo --port 10002
config = {_id: 'shard2', members: [
{_id: 0, host:
'192.168.129.172:10002'},
{_id: 1, host:
'192.168.129.142:10002'},
{_id: 2, host:
'192.168.129.175:10002', arbiterOnly: true}
]}
rs.initiate(config)
rs.status()
192.168.129.173
mkdir -p /usr/data/shard3
mkdir -p /usr/data/shard4
mkdir -p /usr/data/shard1
mkdir -p /usr/data/config3
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --shardsvr
--port 10003 --dbpath /usr/data/shard3/ --logpath
/usr/data/shard3/log.log --replSet shard3 --rest
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --shardsvr
--port 10004 --dbpath /usr/data/shard4/ --logpath
/usr/data/shard4/log.log --replSet shard4 --rest
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --shardsvr
--port 10001 --dbpath /usr/data/shard1/ --logpath
/usr/data/shard1/log.log --replSet shard1 --rest
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --configsvr
--port 20003 --dbpath /usr/data/config3/ --logpath
/usr/data/config3/log.log --rest
ps aux | grep mongodb | grep -v grep
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongo --port 10003
config = {_id: 'shard3', members: [
{_id: 0, host:
'192.168.129.173:10003'},
{_id: 1, host:
'192.168.129.175:10003'},
{_id: 2, host:
'192.168.129.142:10003', arbiterOnly: true}
]}
rs.initiate(config)
rs.status()
192.168.129.175
mkdir -p /usr/data/shard4
mkdir -p /usr/data/shard3
mkdir -p /usr/data/shard2
mkdir -p /usr/data/master
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --shardsvr
--port 10004 --dbpath /usr/data/shard4/ --logpath
/usr/data/shard4/log.log --replSet shard4 --rest
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --shardsvr
--port 10003 --dbpath /usr/data/shard3/ --logpath
/usr/data/shard3/log.log --replSet shard3 --rest
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongod --fork --shardsvr
--port 10002 --dbpath /usr/data/shard2/ --logpath
/usr/data/shard2/log.log --replSet shard2 --rest
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongos --fork --port
40000 --logpath /usr/data/master/log.log --chunkSize 1 --configdb
"192.168.129.142:20001,192.168.129.172:20002,192.168.129.173:20003"
ps aux | grep mongodb | grep -v grep
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongo --port 10004
config = {_id: 'shard4', members: [
{_id: 0, host:
'192.168.129.175:10004'},
{_id: 1, host:
'192.168.129.173:10004'},
{_id: 2, host:
'192.168.129.172:10004', arbiterOnly: true}
]}
rs.initiate(config)
rs.status()
/usr/local/mongodb-linux-x86_64-1.6.4/bin/mongo --port 40000
use admin
db.runCommand({
addshard:'shard1/192.168.129.142:10001,192.168.129.172:10001'
})
db.runCommand({
addshard:'shard2/192.168.129.172:10002,192.168.129.142:10002'
})
db.runCommand({
addshard:'shard3/192.168.129.173:10003,192.168.129.175:10003'
})
db.runCommand({
addshard:'shard4/192.168.129.175:10004,192.168.129.173:10004'
})
db.runCommand({ listshards:1 })
db.runCommand({ enablesharding:'test' })
db.runCommand({ shardcollection:'test.data', key:{_id:1} })
printShardingStatus()
插入大量数据后的结果:
db.data.stats()
{
"sharded" : true,
"ns" : "test.data",
"count" : 1992002,
"size" : 2103555152,
"avgObjSize" : 1056.0005220878293,
"storageSize" : 2464232960,
"nindexes" : 1,
"nchunks" : 23,
"shards" : {
"shard1" : {
"ns" : "test.data",
"count" : 1271788,
"size" : 1343008448,
"avgObjSize" : 1056.0002516142627,
"storageSize" : 1568785152,
"numExtents" : 25,
"nindexes" : 1,
"lastExtentSize" : 267987712,
"paddingFactor" : 1,
"flags" : 1,
"totalIndexSize" : 52658176,
"indexSizes" : {
"_id_" : 52658176
},
"ok" : 1
},
"shard2" : {
"ns" : "test.data",
"count" : 98494,
"size" : 104009808,
"avgObjSize" : 1056.001462017991,
"storageSize" : 111137536,
"numExtents" : 12,
"nindexes" : 1,
"lastExtentSize" : 25047552,
"paddingFactor" : 1,
"flags" : 1,
"totalIndexSize" : 4087808,
"indexSizes" : {
"_id_" : 4087808
},
"ok" : 1
},
"shard3" : {
"ns" : "test.data",
"count" : 487410,
"size" : 514705248,
"avgObjSize" : 1056.000590878316,
"storageSize" : 607047424,
"numExtents" : 20,
"nindexes" : 1,
"lastExtentSize" : 107698688,
"paddingFactor" : 1,
"flags" : 1,
"totalIndexSize" : 20250624,
"indexSizes" : {
"_id_" : 20250624
},
"ok" : 1
},
"shard4" : {
"ns" : "test.data",
"count" : 134310,
"size" : 141831648,
"avgObjSize" : 1056.0021442930533,
"storageSize" : 177262848,
"numExtents" : 14,
"nindexes" : 1,
"lastExtentSize" : 36068352,
"paddingFactor" : 1,
"flags" : 1,
"totalIndexSize" : 5570560,
"indexSizes" : {
"_id_" : 5570560
},
"ok" : 1
}
},
"ok" : 1
}
printShardingStatus()
--- Sharding Status ---
sharding version: { "_id" : 1, "version" : 3 }
shards:
{
"_id" : "shard1",
"host" :
"shard1/192.168.129.142:10001,192.168.129.172:10001"
}
{
"_id" : "shard2",
"host" :
"shard2/192.168.129.172:10002,192.168.129.142:10002"
}
{
"_id" : "shard3",
"host" :
"shard3/192.168.129.173:10003,192.168.129.175:10003"
}
{
"_id" : "shard4",
"host" :
"shard4/192.168.129.175:10004,192.168.129.173:10004"
}
databases:
{ "_id" : "admin", "partitioned" : false, "primary" :
"config" }
{ "_id" : "test", "partitioned" : true, "primary" : "shard1"
}
test.data chunks:
{ "_id" : { $minKey : 1 } } -->> { "_id" :
ObjectId("4d01c5bc926adb17b8000001") } on : shard2 { "t" : 8000,
"i" : 0 }
{ "_id" : ObjectId("4d01c5bc926adb17b8000001") }
-->> { "_id" : ObjectId("4d01c620926adb17b800d1dd") } on :
shard2 { "t" : 10000, "i" : 0 }
{ "_id" : ObjectId("4d01c620926adb17b800d1dd") }
-->> { "_id" : ObjectId("4d01c669926adb17b80180bf") } on :
shard4 { "t" : 9000, "i" : 0 }
{ "_id" : ObjectId("4d01c669926adb17b80180bf") }
-->> { "_id" : ObjectId("4d01c6b6926adb17b8022fa1") } on :
shard2 { "t" : 12000, "i" : 0 }
{ "_id" : ObjectId("4d01c6b6926adb17b8022fa1") }
-->> { "_id" : ObjectId("4d01c6fd926adb17b802de83") } on :
shard1 { "t" : 5000, "i" : 1 }
{ "_id" : ObjectId("4d01c6fd926adb17b802de83") }
-->> { "_id" : ObjectId("4d01c74c926adb17b8038d65") } on :
shard4 { "t" : 11000, "i" : 0 }
{ "_id" : ObjectId("4d01c74c926adb17b8038d65") }
-->> { "_id" : ObjectId("4d01c795926adb17b8043c47") } on :
shard4 { "t" : 13000, "i" : 0 }
{ "_id" : ObjectId("4d01c795926adb17b8043c47") }
-->> { "_id" : ObjectId("4d01c7e6926adb17b804eb29") } on :
shard1 { "t" : 6000, "i" : 2 }
{ "_id" : ObjectId("4d01c7e6926adb17b804eb29") }
-->> { "_id" : ObjectId("4d01c82f926adb17b8059a0b") } on :
shard1 { "t" : 6000, "i" : 4 }
{ "_id" : ObjectId("4d01c82f926adb17b8059a0b") }
-->> { "_id" : ObjectId("4d01c8d4926adb17b806f7cf") } on :
shard1 { "t" : 12000, "i" : 1 }
{ "_id" : ObjectId("4d01c8d4926adb17b806f7cf") }
-->> { "_id" : ObjectId("4d01c963926adb17b8085593") } on :
shard3 { "t" : 7000, "i" : 2 }
{ "_id" : ObjectId("4d01c963926adb17b8085593") }
-->> { "_id" : ObjectId("4d01ca1c926adb17b809b357") } on :
shard3 { "t" : 7000, "i" : 4 }
{ "_id" : ObjectId("4d01ca1c926adb17b809b357") }
-->> { "_id" : ObjectId("4d01caf7926adb17b80b306a") } on :
shard3 { "t" : 7000, "i" : 6 }
{ "_id" : ObjectId("4d01caf7926adb17b80b306a") }
-->> { "_id" : ObjectId("4d01cbc2926adb17b80d09fd") } on :
shard3 { "t" : 13000, "i" : 2 }
{ "_id" : ObjectId("4d01cbc2926adb17b80d09fd") }
-->> { "_id" : ObjectId("4d01cc54926adb17b80e67c1") } on :
shard3 { "t" : 14000, "i" : 1 }
{ "_id" : ObjectId("4d01cc54926adb17b80e67c1") }
-->> { "_id" : ObjectId("4d01cec7926adb125c00d1dc") } on :
shard1 { "t" : 14000, "i" : 2 }
{ "_id" : ObjectId("4d01cec7926adb125c00d1dc") }
-->> { "_id" : ObjectId("4d01ced2926adb125c022fa0") } on :
shard1 { "t" : 14000, "i" : 4 }
{ "_id" : ObjectId("4d01ced2926adb125c022fa0") }
-->> { "_id" : ObjectId("4d01cedf926adb125c038d64") } on :
shard1 { "t" : 14000, "i" : 6 }
{ "_id" : ObjectId("4d01cedf926adb125c038d64") }
-->> { "_id" : ObjectId("4d01ceeb926adb125c04eb28") } on :
shard1 { "t" : 14000, "i" : 8 }
{ "_id" : ObjectId("4d01ceeb926adb125c04eb28") }
-->> { "_id" : ObjectId("4d01cf1a926adb125c07a6ab") } on :
shard1 { "t" : 14000, "i" : 10 }
{ "_id" : ObjectId("4d01cf1a926adb125c07a6ab") }
-->> { "_id" : ObjectId("4d01cf3c926adb125c0a622e") } on :
shard1 { "t" : 14000, "i" : 12 }
{ "_id" : ObjectId("4d01cf3c926adb125c0a622e") }
-->> { "_id" : ObjectId("4d01cf52926adb125c0d1db1") } on :
shard1 { "t" : 14000, "i" : 14 }
{ "_id" : ObjectId("4d01cf52926adb125c0d1db1") }
-->> { "_id" : ObjectId("4d01d58c926adb16480096f4") } on :
shard1 { "t" : 14000, "i" : 16 }
{ "_id" : ObjectId("4d01d58c926adb16480096f4") }
-->> { "_id" : { $maxKey : 1 } } on : shard1 { "t" : 14000,
"i" : 17 }
另,这套配置插入1万条1KB数据的时间大约在1.4秒,如果使用最简单单进程配置的话速度稍快,在1.2秒,性能下降不是很厉害,可以接受。
在这里我们配置路由服务以1MB数据作为一个分块(--chunkSize 1),大约在10MB数据量的时候,数据开始写入shard3,在500MB数据量的时候,数据开始移到shard2和shard4。
经过测试发现达到1000万数据量之后,有sharding的数据库进行无索引查询耗时8秒(最大的sharding数据量在350万),而没有sharding的数据库耗时260秒…………