pymongo
from pymongo import MongoClient
client = MongoClient()
coll = client.db.collections
mongo
- aggregate
group 近似于 groupby
db.collections.aggregate([
{$match:
{'GENDER': 'F',
'DOB':
{ $gte: 19400801,
$lte: 20131231 } } },
{$group:
{_id: "$GENDER",
totalscore:{ $sum: 1}}}
])
- distinct
db.collections.distinct('key1', {'key2':'str chosen'})
# distinct(field, {query}, {options})
- mongoexport
mongoexport -d database -c collection -f name,age -q '{"raw.category":"首页>图解"}' -o data.json
# 筛选fields 且当fields为dict时,有以下两种写法。
# 注意,仅可用于export成csv的情况!!!
mongoexport -d database -c collection -f '_id,raw.website,raw.category,raw_doc.metadata.institution' --type csv -o data.csv
mongoexport -d database -c collection --fieldFile files.txt --type csv -o data.csv
files.txt
_id
raw.website
raw.category
raw_doc.metadata.institution
【用于进入mongo之前】
- mongo 正则表达式
db.posts.find({post_text:{$regex:"runoob"}})