-
Notifications
You must be signed in to change notification settings - Fork 107
/
readme.txt
executable file
·40 lines (34 loc) · 1.87 KB
/
readme.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
用户基本信息表(user_base_info,对应 MongoDB 集合 zh_user):
_id int, # 用户id,自增,非空
url string,
username string, # 用户名,如 zhouyuan
nickname string, # 昵称,如 周源
location string, # 居住地
industry string, # 行业,如 互联网
sex int, # 性别,1:男, 2:女, 0:未知
jobs [], # 工作经历,数组
educations [], # 教育经历,数组
description string, # 自我简介
sinaweibo string, # 新浪微博账号
tencentweibo string, # 腾讯微博账号
# qq string, # QQ号
ask_num int, # 提问数, 如 590
answer_num int, # 回答数,如 340
post_num int, # 专栏文章数, 如 3
collection_num int, # 收藏数,如 9
log_num int, # 编辑数,如 14980
agree_num int, # 收到的赞同,如 15316
thank_num int, # 收到的感谢,如 3500
fav_num int, # 被收藏次数,如 9424
share_num int, # 被分享次数,如 922
followee_num int, # 关注数,如 1515
follower_num int, # 被关注数(粉丝),如 319529
update_time datetime # 信息更新时间,如 2014-05-17 11:15:00
# 按行业统计用户数(在 mongo shell 中执行):
db.zh_user.find({"industry":"高新科技"}).count()
db.zh_user.find({"industry":"互联网"}).count()
db.zh_user.find({"industry":"电子商务"}).count()
db.zh_user.find({"industry":"电子游戏"}).count()
db.zh_user.find({"industry":"计算机软件"}).count()
db.zh_user.find({"industry":"计算机硬件"}).count()
# 导出为 CSV(注:mongoexport 3.0 及以上版本中 --csv 已被 --type=csv 取代):
./mongoexport -d zhihu -c zh_user --csv -f _id,url,username,nickname,location,industry,sex,description,sinaweibo,tencentweibo,ask_num,answer_num,post_num,collection_num,log_num,agree_num,thank_num,fav_num,share_num,followee_num,follower_num,update_time --out ~/tmp/zh_user.csv
./mongoexport -d zhihu -c gh_user --csv -f _id,url,user_id,username,nickname,type,location,update_time,email,website,member_num,company,join_date,followee_num,follower_num,star_num,repo_num,org_num --out ~/tmp/gh_user.csv